avcut.c

/*
 * avcut
 *
 *  Copyright (C) 2015 Mario Kicherer (dev@kicherer.org)
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 *
 */

#include <stdlib.h>
#include <stdio.h>
#include <string.h>
#include <float.h>
#include <sys/stat.h>

#include <libavformat/avformat.h>
#include <libavcodec/avcodec.h>

#define AVCUT_DUMP_CHAR(var, length) { size_t i; for (i=0; i<(length); i++) { printf("%x ", ((char*) (var))[i]); } printf("\n"); }

#if LIBAVCODEC_VERSION_INT < AV_VERSION_INT(55,28,1)
#define av_frame_alloc avcodec_alloc_frame
#define av_frame_free avcodec_free_frame
#endif

// buffer management struct for a stream
struct packet_buffer {
	unsigned int stream_index;
	char stop_reading_stream; // do we have all required packets for this stream?
	
	AVPacket *pkts;
	size_t n_pkts; // number of pkts in .pkts
	
	AVFrame **frames;
	size_t n_frames; // number of frames in .frames
	
	size_t length; // allocated array length of .pkts and .frames
	
	unsigned long duration_dropped_pkts; // accumulated duration of dropped packets
	
	double next_dts; // DTS of the next packet that will be written
	long last_pts; // store last PTS in case we're dealing with AVIs where the
				// last two frames may have a zero DTS
};

// project state context
struct project {
	AVFormatContext *in_fctx;
	AVFormatContext *out_fctx;
	char has_b_frames;
	
	unsigned int n_stream_ids; // number of streams in output file
	unsigned int *stream_ids; // mapping of output stream to input stream
	
	double *cuts; // [ first_excluded_frame, first_included_frame, ...]
	size_t n_cuts;
	
	double stop_after_ts; // stop after this timestamp
	char stop_reading; // signal to stop reading new packets
	char last_flush;
	
	size_t video_packets_read;
	size_t other_packets_read;
	size_t video_packets_decoded;
	size_t video_frames_encoded;
	size_t video_packets_written;
	size_t other_packets_written;
	
	AVBitStreamFilterContext *bsf_h264_to_annexb;
	AVBitStreamFilterContext *bsf_dump_extra;
};

// private data avcut may store with each AVCodecContext
struct codeccontext {
	char h264_avcc_format; // flag: h264 stream with annexb = 0, or avcc = 1
};


#if (LIBAVCODEC_VERSION_MAJOR < 55) || \
	( (LIBAVCODEC_VERSION_MAJOR == 55) && (LIBAVCODEC_VERSION_MINOR < 55) )
// backported function to fix compilation with versions < v2.3
void av_packet_rescale_ts(AVPacket *pkt, AVRational src_tb, AVRational dst_tb)
{
	if (pkt->pts != AV_NOPTS_VALUE)
		pkt->pts = av_rescale_q(pkt->pts, src_tb, dst_tb);
	if (pkt->dts != AV_NOPTS_VALUE)
		pkt->dts = av_rescale_q(pkt->dts, src_tb, dst_tb);
	if (pkt->duration > 0)
		pkt->duration = av_rescale_q(pkt->duration, src_tb, dst_tb);
	#if FF_API_CONVERGENCE_DURATION
	FF_DISABLE_DEPRECATION_WARNINGS
	if (pkt->convergence_duration > 0)
		pkt->convergence_duration = av_rescale_q(pkt->convergence_duration, src_tb, dst_tb);
	FF_ENABLE_DEPRECATION_WARNINGS
	#endif
}
#endif

// encode a frame and write the resulting packet into the output file
int encode_write_frame(struct project *pr, struct packet_buffer *s, AVFrame *frame, int *got_frame_p) {
	AVPacket enc_pkt = { .data = NULL, .size = 0 };
	int got_frame, ret;
	AVStream *ostream = pr->out_fctx->streams[s->stream_index];
	
	
	if (frame)
		av_log(NULL, AV_LOG_DEBUG, "enc frame pts: %" PRId64 " pkt_pts: %" PRId64 " pkt_dts: %" PRId64 " pkt_size: %d type: %c to %f\n",
			frame->pts, frame->pkt_pts, frame->pkt_dts, frame->pkt_size, av_get_picture_type_char(frame->pict_type),
			frame->pts * av_q2d(ostream->codec->time_base)
			);
	
	av_init_packet(&enc_pkt);
	
	ret = avcodec_encode_video2(ostream->codec, &enc_pkt, frame, &got_frame);
	if (ret < 0) {
		av_log(NULL, AV_LOG_ERROR, "error while encoding frame, error %d\n", ret);
		return ret;
	}
	
	if (got_frame) {
		pr->video_frames_encoded++;
		
		enc_pkt.stream_index = s->stream_index;
		if (enc_pkt.duration == 0)
			enc_pkt.duration = ostream->codec->ticks_per_frame;
		
		av_packet_rescale_ts(&enc_pkt, ostream->codec->time_base, ostream->time_base);
		
		enc_pkt.dts = s->next_dts;
		s->next_dts += enc_pkt.duration;
		
		// copy the header to the beginning of each key frame if we use a global header
		if (ostream->codec->flags & CODEC_FLAG_GLOBAL_HEADER)
			av_bitstream_filter_filter(pr->bsf_dump_extra, ostream->codec, NULL,
				&enc_pkt.data, &enc_pkt.size, enc_pkt.data, enc_pkt.size,
				enc_pkt.flags & AV_PKT_FLAG_KEY);
		
		av_log(NULL, AV_LOG_DEBUG,
			"write v enc size: %d pts: %" PRId64 " dts: %" PRId64 " - to %f\n",
			enc_pkt.size, enc_pkt.pts, enc_pkt.dts,
			enc_pkt.pts*ostream->time_base.num/(double)ostream->time_base.den);
		
		pr->video_packets_written++;
		ret = av_interleaved_write_frame(pr->out_fctx, &enc_pkt);
		if (ret < 0) {
			av_log(NULL, AV_LOG_ERROR, "error while writing packet, error %d\n", ret);
			return ret;
		}
		
		av_frame_free(&frame);
		av_packet_unref(&enc_pkt);
	}
	
	if (got_frame_p)
		*got_frame_p = got_frame;
	
	return 0;
}

// calculate stream timestamp of frame using its PTS
double frame_pts2ts(struct project *pr, struct packet_buffer *s, AVFrame *frame) {
	return frame->pts * av_q2d(pr->in_fctx->streams[s->stream_index]->codec->time_base);
}

// check if pkt/frame at timestamp $ts shall be included
char ts_included(struct project *pr, double ts) {
	size_t i;
	
	// check if timestampe lies in a cut interval
	for (i=0; i < pr->n_cuts; i+=2) {
		if (pr->cuts[i] <= ts && ts < pr->cuts[i+1])
			return 0;
		
		// list is ordered
		if (ts < pr->cuts[i])
			return 1;
	}
	
	return 1;
}

#define BUF_COPY_COMPLETE 1<<0
#define BUF_DROP_COMPLETE 1<<1
#define BUF_CUT_IN_BETWEEN 1<<2

// check if the complete buffer will be used or if a cutpoint lies in this interval
char get_buffer_processing_mode(struct project *pr, struct packet_buffer *s, unsigned long last_iframe) {
	double buf_start, buf_end;
	size_t i;
	
	if (!last_iframe) {
		buf_start = s->pkts[0].pts * av_q2d(pr->in_fctx->streams[s->stream_index]->time_base);
		buf_end = s->pkts[s->n_pkts-1].pts * av_q2d(pr->in_fctx->streams[s->stream_index]->time_base);
	} else {
		buf_start = frame_pts2ts(pr, s, s->frames[0]);
		buf_end = frame_pts2ts(pr, s, s->frames[last_iframe]);
	}
	
	av_log(NULL, AV_LOG_DEBUG, "check buffer stream %u: %f to %f\n", s->stream_index, buf_start, buf_end);
	
	for (i=0; i < pr->n_cuts; i++) {
		// check if any cutpoint lies between buffer start and end
		if (buf_start < pr->cuts[i] && pr->cuts[i] < buf_end)
			return BUF_CUT_IN_BETWEEN;
		
		// check if buffer lies between cutpoints
		if (pr->cuts[i] <= buf_start && buf_end <= pr->cuts[i+1]) {
			if (i % 2 == 0)
				return BUF_DROP_COMPLETE;
			else
				return BUF_COPY_COMPLETE;
		}
		
		// stop if further cuts lie behind current buffer
		if (buf_end < pr->cuts[i])
			return BUF_COPY_COMPLETE;
	}
	
	av_log(NULL, AV_LOG_ERROR, "cannot determine processing mode\n");
	
	return -1;
}

// get the number of dropped frames prior to source timestamp $ts
double get_n_dropped_pkgs_at_ts(struct project *pr, struct packet_buffer *s, double ts) {
	size_t i;
	double result = 0;
	
	// we only consider positive values
	#define FLOOR(x) ( (double) ((long)(x)) )
	
	for (i=0; i < pr->n_cuts; i+=2) {
		if (pr->cuts[i+1] <= ts) {
			// TODO include or drop frame that would be cut in two pieces?
			// round down value as given cut points may not match the time base
			result += FLOOR((pr->cuts[i+1] - pr->cuts[i]) /
				av_q2d(pr->in_fctx->streams[s->stream_index]->time_base));
		} else {
			break;
		}
	}
	
// 	av_log(NULL, AV_LOG_DEBUG, "dropped pkgs at %f (tb %f): %f\n", ts,
// 		av_q2d(pr->in_fctx->streams[s->stream_index]->time_base), result);
	
	return result;
}

char find_packet_for_frame(struct packet_buffer *s, size_t frame_idx, size_t *packet_idx) {
	size_t i;
	
	for (i=0;i<s->n_pkts;i++) {
		// we cannot compare packet.dts with frame.pkt_dts as they differ by 2 (maybe caused by multithreading)
		if (
			(s->pkts[i].pts != AV_NOPTS_VALUE &&
				s->pkts[i].pts == s->frames[frame_idx]->pkt_pts) ||
			(s->pkts[i].pts == AV_NOPTS_VALUE && s->pkts[i].dts != AV_NOPTS_VALUE &&
				s->pkts[i].dts == s->frames[frame_idx]->coded_picture_number) ||
			(s->pkts[i].pts == AV_NOPTS_VALUE && s->pkts[i].dts == AV_NOPTS_VALUE &&
				s->frames[frame_idx]->pkt_size == s->pkts[i].size)
		)
		{
			#ifndef USING_LIBAV
			// libav is missing pkt_size
			if (s->frames[frame_idx]->pkt_size != s->pkts[i].size) {
				av_log(NULL, AV_LOG_ERROR,
					  "size mismatch %zu:%d %zu:%d\n",
						frame_idx, s->frames[frame_idx]->pkt_size, i,
						s->pkts[i].size);
				exit(1);
			}
			#endif
			
			*packet_idx = i;
// 			printf("found %zu %zu \n", i, s->frames[frame_idx]->pts);
			return 1;
		}
	}
	
	av_log(NULL, AV_LOG_ERROR, "packet for frame %zu (cpn %d) not found\n",
			frame_idx, s->frames[frame_idx]->coded_picture_number);
	
	for (i=0;i<s->n_pkts;i++) {
		av_log(NULL, AV_LOG_DEBUG, "%" PRId64 " %" PRId64 " %" PRId64 " %" PRId64 " - %d %d - %d (NOPTS: %" PRId64 ")\n",
				s->pkts[i].pts, s->pkts[i].dts, s->frames[frame_idx]->pkt_dts,
				s->frames[frame_idx]->pkt_pts,
				s->frames[frame_idx]->pkt_size, s->pkts[i].size,
				s->frames[frame_idx]->coded_picture_number,
				AV_NOPTS_VALUE);
	}
	
	return 0;
}

// process packet buffer - either copy, ignore or reencode packets in the packet buffer according to the cut list
void flush_packet_buffer(struct project *pr, struct packet_buffer *s, char last_flush) {
	size_t i, j, last_pkt;
	int ret;
	char buffer_mode = 0;
	double ts;
	size_t last_frame;
	
	
	if (!s->pkts || s->n_pkts == 0)
		return;
	
	if (pr->in_fctx->streams[s->stream_index]->codec->codec_type != AVMEDIA_TYPE_VIDEO) {
		// check if we can copy/drop the complete buffer or if we have to check each packet individually
		buffer_mode = get_buffer_processing_mode(pr, s, 0);
		
		for (i=0;i<s->n_pkts;i++) {
			ts = s->pkts[i].pts * av_q2d(pr->in_fctx->streams[s->stream_index]->time_base);
			
			if (pr->stop_after_ts < ts)
				s->stop_reading_stream = 1;
			
			if   ( !( buffer_mode & BUF_DROP_COMPLETE) &&
					( (buffer_mode & BUF_COPY_COMPLETE) || ts_included(pr, ts) )
				)
			{
				s->pkts[i].pts -= s->duration_dropped_pkts;
				
				// calculate duration precisely to avoid deviation between PTS and DTS
				double dur = s->pkts[i].duration * av_q2d(pr->in_fctx->streams[s->stream_index]->time_base) /
							av_q2d( pr->out_fctx->streams[s->stream_index]->time_base);
				
				av_packet_rescale_ts(&s->pkts[i], pr->in_fctx->streams[s->stream_index]->time_base,
								 pr->out_fctx->streams[s->stream_index]->time_base);
				
				#define ROUND(x) ((int64_t)((x)+0.5))
				s->pkts[i].dts = ROUND(s->next_dts);
				s->next_dts += dur;
				
				av_log(NULL, AV_LOG_DEBUG,
					"write a cpy pts: %" PRId64 " dts: %" PRId64 " - %f to %f\n",
					s->pkts[i].pts, s->pkts[i].dts, ts,
					s->pkts[i].pts * av_q2d(pr->out_fctx->streams[s->stream_index]->time_base));
				
				pr->other_packets_written++;
				ret = av_interleaved_write_frame(pr->out_fctx, &s->pkts[i]);
				if (ret < 0) {
					av_log(NULL, AV_LOG_ERROR, "error while writing packet, error %d\n", ret);
					exit(ret);
				}
			} else {
				s->duration_dropped_pkts += s->pkts[i].duration;
			}
			
			av_packet_unref(&s->pkts[i]);
		}
		
		s->n_pkts = 0;
		return;
	}
	
	if (s->n_frames > 1) {
		// If this is the last flush, process all frames. If not, ignore the last
		// frame (that is an I frame) as we process it during the next buffer flush
		if (last_flush)
			last_frame = s->n_frames-1;
		else
			last_frame = s->n_frames-2;
		
		// check if we can copy the complete buffer or if we have to check each packet individually
		buffer_mode = get_buffer_processing_mode(pr, s, last_frame);
	} else {
		buffer_mode = BUF_COPY_COMPLETE;
	}
	
	// determine the last packet we have to look at for this GOP
	if (last_flush) {
		// we consider all packets during the last flush
		last_pkt = s->n_pkts-1;
	} else {
		// find the packet with the highest DTS in this GOP
		
		/*
		 * The packet that belongs to the last frame in a GOP might not have
		 * the highest DTS of the GOP's packets. Hence, we search backwards
		 * for the packet with the highest DTS. Otherwise, we might miss packets,
		 * e.g., if the last frame is a P frame, its DTS is lower as the DTS
		 * of the preceding B frames.
		 * 
		 * We stop with the search if we have found two P frames or after a
		 * B frame and a P frame has been found.
		 */
		
		size_t pkt_idx;
		char b_found = 0;
		char n_p_frames = 0;
		
		last_pkt = 0;
		for (i = s->n_frames-2; i > 0; i--) {
			if (s->frames[i]->pict_type == AV_PICTURE_TYPE_B)
				b_found=1;
			if (s->frames[i]->pict_type == AV_PICTURE_TYPE_P) {
				n_p_frames++;
				if (b_found || n_p_frames > 2)
					break;
			}
			
			if (!find_packet_for_frame(s, i, &pkt_idx))
				exit(1);
			if (pkt_idx > last_pkt)
				last_pkt = pkt_idx;
		}
		
		if (buffer_mode & BUF_CUT_IN_BETWEEN) {
			// if we encode all frames we don't need the original packets
			for (i=0;i<=last_pkt;i++)
				av_packet_unref(&s->pkts[i]);
		}
	}
	
	// TODO: check if we can simply cut if the last frame is a P-frame
	
	if (buffer_mode & BUF_CUT_IN_BETWEEN) {
		char frame_written = 0;
		
		// check which frames will be included and encode them
		for (i=0;i<s->n_frames-1;i++) {
			if (!s->frames[i]) {
				av_log(NULL, AV_LOG_ERROR, "no frame %zu\n", i);
				exit(1);
			}
			
			ts = frame_pts2ts(pr, s, s->frames[i]);
			
			// calculate new PTS
			s->frames[i]->pts -= av_rescale_q(s->duration_dropped_pkts,
						pr->in_fctx->streams[s->stream_index]->time_base,
						pr->in_fctx->streams[s->stream_index]->codec->time_base);
			
			if (pr->stop_after_ts < ts)
				s->stop_reading_stream = 1;
			
			if (ts_included(pr, ts)) {
				#ifndef USING_LIBAV
				s->frames[i]->pict_type = AV_PICTURE_TYPE_NONE;
				#else
				s->frames[i]->pict_type = 0;
				#endif
				
				ret = encode_write_frame(pr, s, s->frames[i], 0);
				if (ret < 0) {
					av_log(NULL, AV_LOG_ERROR, "encode_write_frame failed, error %d\n", ret);
					exit(ret);
				}
				
				frame_written = 1;
			} else {
				s->duration_dropped_pkts += av_frame_get_pkt_duration(s->frames[i]);
				av_frame_free(&s->frames[i]);
			}
		}
		
		// if the encoder emits packets delayed in time, flush the encoder to receive all remaining packets in the queue
		if (frame_written && pr->out_fctx->streams[s->stream_index]->codec->codec->capabilities & CODEC_CAP_DELAY) {
			av_log(NULL, AV_LOG_DEBUG, "Local flushing stream #%u\n", s->stream_index);
			while (1) {
				int got_frame;
				
				ret = encode_write_frame(pr, s, 0, &got_frame);
				if (ret < 0) {
					#ifndef USING_LIBAV
					av_log(NULL, AV_LOG_ERROR, "encode_write_frame failed, error %d: %s\n", ret, av_err2str(ret));
					#else
					char errbuf[256];
					av_strerror(ret, errbuf, 256);
					av_log(NULL, AV_LOG_ERROR, "encode_write_frame failed, error %d: %s\n", ret, errbuf);
					#endif
					exit(ret);
				}
				if (!got_frame) {
					av_log(NULL, AV_LOG_DEBUG, "flush end\n");
					break;
				}
			}
		}
		
		if (frame_written) {
			// Some encoders do not like new frames after we flushed them.
			// Hence, we restart the encoder.
			AVCodecContext *out_cctx = pr->out_fctx->streams[s->stream_index]->codec;
			
			out_cctx->codec->close(out_cctx);
			out_cctx->codec->init(out_cctx);
		}
	} else
	if (buffer_mode & BUF_COPY_COMPLETE) {
		for (i=0;i<=last_pkt;i++) {
			AVFrame *frame;
			
			// find frame for current packet to determine the PTS
			frame = 0;
			for (j=0;j<s->n_frames;j++) {
				if (
					(s->pkts[i].pts != AV_NOPTS_VALUE &&
						s->pkts[i].pts == s->frames[j]->pkt_pts) ||
					(s->pkts[i].pts == AV_NOPTS_VALUE && s->pkts[i].dts != AV_NOPTS_VALUE &&
						s->pkts[i].dts == s->frames[j]->coded_picture_number) ||
					(s->pkts[i].pts == AV_NOPTS_VALUE && s->pkts[i].dts == AV_NOPTS_VALUE &&
						s->frames[j]->pkt_size == s->pkts[i].size)
					)
				{
					#ifndef USING_LIBAV
					// libav is missing pkt_size
					if (s->frames[j]->pkt_size != s->pkts[i].size) {
						av_log(NULL, AV_LOG_ERROR,
							"size mismatch %zu:%d %zu:%d (dts %" PRId64 ")\n",
							j, s->frames[j]->pkt_size, i, s->pkts[i].size, s->pkts[i].dts);
						exit(1);
					}
					#endif
					
					frame = s->frames[j];
					break;
				}
			}
			if (!frame) {
				av_log(NULL, AV_LOG_ERROR,
					"frame for pkt #%zd (dts %" PRId64 " pts %" PRId64 ") not found\n",
					i, s->pkts[i].dts, s->pkts[i].pts);
				
				av_log(NULL, AV_LOG_DEBUG, "pkt_pts pkt_dts frame->pkt_dts frame->pkt_pts - frame->pkt_size pkt_size - cpn\n");
				for (j=0;j<s->n_frames;j++) {
					av_log(NULL, AV_LOG_DEBUG, "%" PRId64 " %" PRId64 " %" PRId64 " %" PRId64 " - %6d %6d - %d type: %c (NOPTS: %" PRId64 ")\n",
						s->pkts[i].pts, s->pkts[i].dts, s->frames[j]->pkt_dts,
						s->frames[j]->pkt_pts,
						s->frames[j]->pkt_size, s->pkts[i].size,
						s->frames[j]->coded_picture_number,
						av_get_picture_type_char(s->frames[j]->pict_type),
						AV_NOPTS_VALUE);
				}
				
				exit(1);
			}
			
			s->pkts[i].pts = av_rescale_q(frame->pts,
					pr->in_fctx->streams[s->stream_index]->codec->time_base,
					pr->in_fctx->streams[s->stream_index]->time_base);
			
			ts = frame_pts2ts(pr, s, s->frames[i]);
			
			if (pr->stop_after_ts < ts)
				s->stop_reading_stream = 1;
			
			if (ts_included(pr, ts)) {
				s->pkts[i].pts -= s->duration_dropped_pkts;
				
				// calculate duration precisely to avoid deviation between PTS and DTS
				double dur = s->pkts[i].duration * av_q2d(pr->in_fctx->streams[s->stream_index]->time_base) /
					av_q2d( pr->out_fctx->streams[s->stream_index]->time_base);
				
				av_packet_rescale_ts(&s->pkts[i], pr->in_fctx->streams[s->stream_index]->time_base,
								 pr->out_fctx->streams[s->stream_index]->time_base);
				
				s->pkts[i].dts = s->next_dts;
				s->next_dts += dur;
				
				// if the original h264 stream is in AVCC format, convert it to Annex B
				if (pr->in_fctx->streams[s->stream_index]->codec->opaque &&
					((struct codeccontext*) pr->in_fctx->streams[s->stream_index]->codec->opaque)->h264_avcc_format)
				{
					av_bitstream_filter_filter(pr->bsf_h264_to_annexb,
						pr->in_fctx->streams[s->stream_index]->codec, NULL,
						&s->pkts[i].data, &s->pkts[i].size, s->pkts[i].data, s->pkts[i].size,
						s->pkts[i].flags & AV_PKT_FLAG_KEY);
				}
				
				av_log(NULL, AV_LOG_DEBUG,
					"write v cpy size: %d pts: %" PRId64 " dts: %" PRId64 " - %f to %f\n",
					s->pkts[i].size, s->pkts[i].pts, s->pkts[i].dts, ts,
					s->pkts[i].pts * pr->out_fctx->streams[s->stream_index]->time_base.num /
						(double)pr->out_fctx->streams[s->stream_index]->time_base.den
					);
				
				pr->video_packets_written++;
				ret = av_interleaved_write_frame(pr->out_fctx, &s->pkts[i]);
				if (ret < 0) {
					av_log(NULL, AV_LOG_ERROR, "error while writing packet, error %d\n", ret);
					exit(ret);
				}
			} else {
				s->duration_dropped_pkts += s->pkts[i].duration;
			}
			
			av_packet_unref(&s->pkts[i]);
		}
		
		for (j=0;j<s->n_frames-1;j++)
			av_frame_free(&s->frames[j]);
	} else {
		for (i=0;i<=last_pkt;i++) {
			s->duration_dropped_pkts += s->pkts[i].duration;
			av_packet_unref(&s->pkts[i]);
		}
		
		for (j=0;j<s->n_frames-1;j++)
			av_frame_free(&s->frames[j]);
	}
	
	// update buffer structures
	AVPacket *newpkts = (AVPacket*) av_realloc(0, sizeof(AVPacket)*s->length);
	j = 0;
	for (i=0;i<s->n_pkts;i++) {
		if (s->pkts[i].size != 0 && s->pkts[i].data != NULL) {
			memcpy(&newpkts[j], &s->pkts[i], sizeof(AVPacket));
			j++;
		}
	}
	av_freep(&s->pkts);
	s->pkts = newpkts;
	s->n_pkts = j;
	
	s->frames[0] = s->frames[s->n_frames-1];
	s->n_frames = 1;
}

// decode a video packet and store it in the buffer
int decode_packet(struct project *pr, struct packet_buffer *sbuffer, unsigned int stream_index, AVPacket *packet) {
	enum AVMediaType mtype;
	int got_frame, ret, i;
	AVFrame *frame = NULL;
	AVPacket nullpacket = { .data = NULL, .size = 0 };
	
	if (!packet)
		packet = &nullpacket;
	
	mtype = pr->in_fctx->streams[stream_index]->codec->codec_type;
	
	got_frame = 0;
	if (mtype == AVMEDIA_TYPE_VIDEO) {
		if (!(frame = av_frame_alloc())) {
			av_log(NULL, AV_LOG_ERROR, "error while allocating frame\n");
			return AVERROR(ENOMEM);
		}
		
		ret = avcodec_decode_video2(pr->in_fctx->streams[stream_index]->codec, frame, &got_frame, packet);
		
		if (ret < 0) {
			av_frame_free(&frame);
			av_log(NULL, AV_LOG_ERROR, "Decoding frame failed\n");
			return ret;
		}
		
		if (got_frame) {
// 			av_log(NULL, AV_LOG_DEBUG, "dec frame pts: %" PRId64 " pkt_pts: %" PRId64 " pkt_dts: %" PRId64 " pkt_size: %d type: %c to %f\n",
// 				  frame->pts, frame->pkt_pts, frame->pkt_dts, frame->pkt_size, av_get_picture_type_char(frame->pict_type),
// 				  frame->pts*av_q2d(pr->in_fctx->streams[stream_index]->codec->time_base)
// 			);
			
			sbuffer[stream_index].frames[sbuffer[stream_index].n_frames] = frame;
			sbuffer[stream_index].n_frames++;
			
			pr->video_packets_decoded++;
			
			#ifndef USING_LIBAV
			frame->pts = av_frame_get_best_effort_timestamp(frame);
			#else
			if (frame->pkt_pts != AV_NOPTS_VALUE)
				frame->pts = frame->pkt_pts;
			else
				frame->pts = frame->pkt_dts;
			#endif
			
			// convert from packet to frame time_base, if necessary
			if (frame->pts == frame->pkt_dts || frame->pts == frame->pkt_pts)
				frame->pts = av_rescale_q(frame->pts,
							pr->in_fctx->streams[stream_index]->time_base,
							pr->in_fctx->streams[stream_index]->codec->time_base);
			
			// The last frames in some AVIs have a DTS of zero. Here, we
			// override the PTS (copied from DTS) in such a case to provide
			// an increasing PTS
			if (frame->pts < sbuffer->last_pts) {
				int64_t new_pts = sbuffer->last_pts + av_rescale_q(frame->pkt_duration,
					pr->in_fctx->streams[stream_index]->time_base,
					pr->in_fctx->streams[stream_index]->codec->time_base);
				av_log(NULL, AV_LOG_DEBUG, "adjusting frame PTS from %" PRId64 " to %" PRId64 "\n", frame->pts, new_pts);
				frame->pts = new_pts;
			}
			
			sbuffer->last_pts = frame->pts;
			
			// the first packet in the video buffer is an I frame, if the
			// current packet contains another I frame, flush the buffer
			if (sbuffer[stream_index].n_frames > 1 && frame->key_frame) {
				if (pr->last_flush == 1)
					pr->stop_reading = 1;
				
				char n_finished_streams = 0;
				for (i = 0; i < pr->n_stream_ids; i++) {
					flush_packet_buffer(pr, &sbuffer[i], 0);
					
					if (sbuffer[i].stop_reading_stream)
						n_finished_streams++;
				}
				
				if (n_finished_streams == pr->n_stream_ids)
					pr->last_flush = 1;
			}
		} else {
			av_frame_free(&frame);
		}
	}
	
	return got_frame;
}

int main(int argc, char **argv) {
	unsigned int i, j;
	int ret;
	char *inputf, *outputf;
	struct project project;
	struct project *pr;
	
	if (argc < 3) {
		av_log(NULL, AV_LOG_INFO, "avcut-" AVCUT_VERSION " - Frame-accurate video cutting with only small quality loss\n\n");
		av_log(NULL, AV_LOG_INFO, "Usage: %s <input file> <output file> [<drop_from_ts> <continue_with_ts> ...]\n", argv[0]);
		return 1;
	}
	
	if (argc % 2 != 1) {
		av_log(NULL, AV_LOG_ERROR, "only even number of cut points allowed\n");
		av_log(NULL, AV_LOG_ERROR, "Usage: %s <input file> <output file> [<drop_from_ts> <continue_with_ts> ...]\n", argv[0]);
		return 1;
	}
	
	inputf = argv[1];
	outputf = argv[2];
	
	pr = &project;
	memset(pr, 0, sizeof(struct project));
	
	pr->n_cuts = argc - 3;
	pr->cuts = (double*) malloc(sizeof(double)*pr->n_cuts);
	pr->stop_after_ts = DBL_MAX;
	pr->last_flush = 0;
	
	for (i=3; i < argc; i++) {
		char *end;
		if ((i % 2 == 0) && !strcmp(argv[i], "-")) {
			pr->stop_after_ts = pr->cuts[i-4];
			pr->cuts[i-3] = DBL_MAX;
		} else {
			pr->cuts[i-3] = strtod(argv[i], &end);
			if (end == argv[i] || *end != 0) {
				av_log(NULL, AV_LOG_ERROR, "error while parsing cut point: %s\n", argv[i]);
			}
		}
	}
	
	#ifdef DEBUG
	av_log_set_level(AV_LOG_DEBUG);
	#else
	if (getenv("AVCUT_VERBOSITY")) {
		av_log_set_level(atoi(getenv("AVCUT_VERBOSITY")));
	}
	#endif
	
	av_register_all();
	
	/*
	 * open input file
	 */
	
	pr->in_fctx = 0;
	if ((ret = avformat_open_input(&pr->in_fctx, inputf, NULL, NULL)) < 0) {
		av_log(NULL, AV_LOG_ERROR, "cannot open input file, error %d\n", ret);
		return ret;
	}
	
	if ((ret = avformat_find_stream_info(pr->in_fctx, NULL)) < 0) {
		av_log(NULL, AV_LOG_ERROR, "Cannot get stream info, error %d\n", ret);
		return ret;
	}
	
	pr->n_stream_ids = 0;
	pr->stream_ids = 0;
	
	for (i = 0; i < pr->in_fctx->nb_streams; i++) {
		AVCodecContext *codec_ctx;
		
		codec_ctx = pr->in_fctx->streams[i]->codec;
		
		// we buffer multiple frames, this avoids that avcodec_decode_video2 overwrites our data
		codec_ctx->refcounted_frames = 1;
		
		if (codec_ctx->codec_type == AVMEDIA_TYPE_VIDEO) { // || codec_ctx->codec_type == AVMEDIA_TYPE_AUDIO) {
			ret = avcodec_open2(codec_ctx, avcodec_find_decoder(codec_ctx->codec_id), NULL);
			if (ret < 0) {
				av_log(NULL, AV_LOG_ERROR, "Failed to open decoder for stream %u, error %d\n", i, ret);
				return ret;
			}
			
			// detect h264 format
			if (codec_ctx->codec_id == AV_CODEC_ID_H264 && codec_ctx->extradata_size > 2) {
				char nalu_start_code1[] = {0x0,0x0,0x1};
				char nalu_start_code2[] = {0x0,0x0,0x0,0x1};
				
				// AVCUT_DUMP_CHAR(codec_ctx->extradata, 4);
				
				struct codeccontext *cctx;
				cctx = av_malloc(sizeof(struct codeccontext));
				if (!cctx) {
					av_log(NULL, AV_LOG_ERROR, "malloc codeccontext failed\n");
					return AVERROR_UNKNOWN;
				}
				codec_ctx->opaque = cctx;
				
// 				for (j=0;j<16;j++) printf("%x ", codec_ctx->extradata[j] ); printf("\n");
				
				if (!memcmp(codec_ctx->extradata, nalu_start_code1, 3) ||
					!memcmp(codec_ctx->extradata, nalu_start_code2, 4))
				{
					cctx->h264_avcc_format = 0;
					av_log(NULL, AV_LOG_DEBUG, "detected h264 in annexb format\n");
				} else {
					cctx->h264_avcc_format = 1;
					av_log(NULL, AV_LOG_DEBUG, "detected h264 in avcc format\n");
				}
			}
		}
		
		switch (codec_ctx->codec_type) {
			case AVMEDIA_TYPE_VIDEO:
			case AVMEDIA_TYPE_AUDIO:
			case AVMEDIA_TYPE_SUBTITLE:
				pr->n_stream_ids++;
				pr->stream_ids = (unsigned int*) realloc(pr->stream_ids, sizeof(unsigned int)*pr->n_stream_ids);
				pr->stream_ids[pr->n_stream_ids-1] = i;
				break;
			default: break;
		}
	}
	
	av_dump_format(pr->in_fctx, 0, inputf, 0);
	
	/*
	 * open output file
	 */
	
	{
		struct stat st;
		if (stat(outputf, &st) == 0) {
			av_log(NULL, AV_LOG_ERROR, "error, output file \"%s\" already exists\n", outputf);
			exit(1);
		}
	}
	
	#ifndef USING_LIBAV
	avformat_alloc_output_context2(&pr->out_fctx, NULL, NULL, outputf);
	#else
	pr->out_fctx = avformat_alloc_context();
	#endif
	if (!pr->out_fctx) {
		av_log(NULL, AV_LOG_ERROR, "Could not create output context\n");
		return AVERROR_UNKNOWN;
	}
	
	#ifdef USING_LIBAV
	av_strlcpy(pr->out_fctx->filename, outputf, sizeof(pr->out_fctx->filename));
	pr->out_fctx->oformat = av_guess_format(NULL, outputf, NULL);
	if (!pr->out_fctx->oformat) {
		avformat_free_context(pr->out_fctx);
		av_log(NULL, AV_LOG_ERROR, "Could not determine output format\n");
		return AVERROR_UNKNOWN;
	}
	#endif
	
	// copy most properties from the input streams to the output streams
	for (j = 0; j < pr->n_stream_ids; j++) {
		AVStream *out_stream;
		AVCodecContext *dec_cctx, *enc_cctx;
		
		i = pr->stream_ids[j];
		
// 		if (pr->in_fctx->streams[i]->disposition & AV_DISPOSITION_ATTACHED_PIC)
// 			continue;
		
		out_stream = avformat_new_stream(pr->out_fctx, NULL);
		if (!out_stream) {
			av_log(NULL, AV_LOG_ERROR, "Failed allocating output stream\n");
			return AVERROR_UNKNOWN;
		}
		
		dec_cctx = pr->in_fctx->streams[i]->codec;
		enc_cctx = out_stream->codec;
		
		out_stream->time_base = pr->in_fctx->streams[i]->time_base;
		
		// copy stream metadata
		av_dict_copy(&out_stream->metadata, pr->in_fctx->streams[i]->metadata, 0);
		
		if (dec_cctx->codec_type == AVMEDIA_TYPE_VIDEO) {
			AVCodec *encoder;
			
			encoder = avcodec_find_encoder(dec_cctx->codec_id);
			if (!encoder) {
				av_log(NULL, AV_LOG_ERROR, "Encoder not found\n");
				return AVERROR_INVALIDDATA;
			}
			
			ret = avcodec_copy_context(enc_cctx, dec_cctx);
			if (ret < 0) {
				av_log(NULL, AV_LOG_ERROR, "Copying stream context failed\n");
				return ret;
			}
			
			// TODO good values?
			enc_cctx->qmin = 16;
			enc_cctx->qmax = 26;
			enc_cctx->max_qdiff = 4;
			if (dec_cctx->has_b_frames) {
				enc_cctx->max_b_frames = 3;
				if (pr->has_b_frames < dec_cctx->has_b_frames)
					pr->has_b_frames = dec_cctx->has_b_frames;
			}
// 			enc_cctx->keyint_min = 200;
// 			enc_cctx->gop_size = 250;
			enc_cctx->thread_count = 1; // spawning more threads causes avcodec_close to free threads multiple times
			enc_cctx->codec_tag = 0; // reset tag to avoid incompatibilities while changing container
			
			out_stream->sample_aspect_ratio = pr->in_fctx->streams[i]->sample_aspect_ratio;
			
			if (pr->out_fctx->oformat->flags & AVFMT_GLOBALHEADER)
				enc_cctx->flags |= CODEC_FLAG_GLOBAL_HEADER;
			
			ret = avcodec_open2(enc_cctx, encoder, NULL);
			if (ret < 0) {
				av_log(NULL, AV_LOG_ERROR, "Failed to open encoder for stream %u, error %d\n", i, ret);
				return ret;
			}
		} else if (dec_cctx->codec_type == AVMEDIA_TYPE_UNKNOWN) {
			av_log(NULL, AV_LOG_ERROR, "Error: input stream #%d is of unknown type\n", i);
			return AVERROR_INVALIDDATA;
		} else {
			ret = avcodec_copy_context(pr->out_fctx->streams[j]->codec, pr->in_fctx->streams[i]->codec);
			if (ret < 0) {
				av_log(NULL, AV_LOG_ERROR, "Copying codec context failed, error %d\n", ret);
				return ret;
			}
			
			enc_cctx->codec_tag = 0;
			
			if (pr->out_fctx->oformat->flags & AVFMT_GLOBALHEADER)
				enc_cctx->flags |= CODEC_FLAG_GLOBAL_HEADER;
		}
	}
	
	// initialize bitstream filters
	pr->bsf_h264_to_annexb = av_bitstream_filter_init("h264_mp4toannexb");
	pr->bsf_dump_extra = av_bitstream_filter_init("dump_extra");
	if (!pr->bsf_dump_extra || !pr->bsf_h264_to_annexb) {
		av_log(NULL, AV_LOG_ERROR, "error while initializing bitstream filters \"dump_extra\" and \"h264_mp4toannexb\"\n");
		exit(1);
	}
	
	if (!(pr->out_fctx->oformat->flags & AVFMT_NOFILE)) {
		ret = avio_open(&pr->out_fctx->pb, outputf, AVIO_FLAG_WRITE);
		if (ret < 0) {
			av_log(NULL, AV_LOG_ERROR, "Cannot open output file '%s', error %d\n", outputf, ret);
			return ret;
		}
	}
	
	// copy main metadata
	av_dict_copy(&pr->out_fctx->metadata, pr->in_fctx->metadata, 0);
	
	av_dump_format(pr->out_fctx, 0, outputf, 1);
	
	ret = avformat_write_header(pr->out_fctx, NULL);
	if (ret < 0) {
		av_log(NULL, AV_LOG_ERROR, "Cannot write header to '%s', error %d\n", outputf, ret);
		return ret;
	}
	
	for (j = 0; j < pr->n_stream_ids; j++) {
		i = pr->stream_ids[j];
		
		#define DUMP_TB(tb) "%5d / %5d\n", (tb)->num, (tb)->den
		av_log(NULL, AV_LOG_DEBUG, "\n");
		av_log(NULL, AV_LOG_DEBUG, "stream %d in:\n", i);
		av_log(NULL, AV_LOG_DEBUG, "stream: " DUMP_TB(&pr->in_fctx->streams[i]->time_base));
		av_log(NULL, AV_LOG_DEBUG, "codec:  " DUMP_TB(&pr->in_fctx->streams[i]->codec->time_base));
		av_log(NULL, AV_LOG_DEBUG, "ticks_per_frame: %d\n", pr->in_fctx->streams[i]->codec->ticks_per_frame);
		av_log(NULL, AV_LOG_DEBUG, "stream %d out:\n", j);
		av_log(NULL, AV_LOG_DEBUG, "stream: " DUMP_TB(&pr->out_fctx->streams[j]->time_base));
		av_log(NULL, AV_LOG_DEBUG, "codec:  " DUMP_TB(&pr->out_fctx->streams[j]->codec->time_base));
		av_log(NULL, AV_LOG_DEBUG, "ticks_per_frame: %d\n", pr->out_fctx->streams[j]->codec->ticks_per_frame);
	}
	av_log(NULL, AV_LOG_DEBUG, "\n");
	
	
	struct packet_buffer *sbuffer;
	sbuffer = (struct packet_buffer*) av_calloc(1, sizeof(struct packet_buffer) * pr->n_stream_ids);
	
	long dts_offset = 0;
	if (pr->has_b_frames) {
		// determine a safe starting value for the DTS from the GOP size
		
		long newo;
		for (j = 0; j < pr->n_stream_ids; j++) {
			i = pr->stream_ids[j];
			// use -gop_size as start for DTS
			newo = pr->in_fctx->streams[i]->codec->gop_size;
			newo = 0 - pr->out_fctx->streams[j]->codec->ticks_per_frame * 
				av_rescale_q(newo, pr->out_fctx->streams[j]->codec->time_base, pr->out_fctx->streams[j]->time_base);
			if (newo < dts_offset)
				dts_offset = newo;
		}
	}
	
	// set the initial DTS for each stream
	for (j = 0; j < pr->n_stream_ids; j++) {
		sbuffer[j].next_dts = dts_offset;
		av_log(NULL, AV_LOG_DEBUG, "initial DTS %u: %.0f\n", j, sbuffer[j].next_dts);
	}
	
	// start processing the input
	pr->stop_reading = 0;
	while (!pr->stop_reading) {
		unsigned int stream_index;
		AVPacket packet = { .data = NULL, .size = 0 };
		
		if ((ret = av_read_frame(pr->in_fctx, &packet)) < 0) {
			if (ret != AVERROR_EOF)
				av_log(NULL, AV_LOG_ERROR, "error while reading next frame: %d\n", ret);
			break;
		}
		
		if (pr->in_fctx->streams[packet.stream_index]->codec->codec_type == AVMEDIA_TYPE_VIDEO)
			pr->video_packets_read++;
		else
			pr->other_packets_read++;
		
		// calculate output stream_index from packet's input stream_index
		for (i=0; i<pr->n_stream_ids; i++) {
			if (pr->stream_ids[i] == packet.stream_index) {
				stream_index = i;
				break;
			}
		}
		if (i==pr->n_stream_ids) {
			// skip packet
			continue;
		}
		
		// check if our buffer is large enough
		if (sbuffer[stream_index].n_pkts == sbuffer[stream_index].length) {
			if (sbuffer[stream_index].pkts == 0)
				sbuffer[stream_index].length = 4;
			sbuffer[stream_index].length *= 2;
			sbuffer[stream_index].pkts = (AVPacket*) av_realloc(sbuffer[stream_index].pkts,
					sizeof(AVPacket)*sbuffer[stream_index].length);
			sbuffer[stream_index].frames = (AVFrame**) av_realloc(sbuffer[stream_index].frames,
					sizeof(AVFrame*)*sbuffer[stream_index].length);
			sbuffer[stream_index].stream_index = stream_index;
		}
		
		memcpy(&sbuffer[stream_index].pkts[sbuffer[stream_index].n_pkts], &packet, sizeof(AVPacket));
		sbuffer[stream_index].n_pkts++;
		
		// decode packet (and start flushing the buffer if necessary)
		ret = decode_packet(pr, sbuffer, stream_index, &packet);
		if (ret < 0)
			return ret;
	}
	
	av_log(NULL, AV_LOG_DEBUG, "flushing decoder...\n");
	
	// if no more packet can be read, there might be still data in the queues, hence flush them if necessary
	for (j = 0; j < pr->n_stream_ids; j++) {
		if (!pr->out_fctx->streams[j]->codec->codec || !(pr->out_fctx->streams[j]->codec->codec->capabilities & CODEC_CAP_DELAY))
			continue;
		
		while (1) {
			ret = decode_packet(pr, sbuffer, j, 0);
			if (ret == 0)
				break;
			if (ret < 0)
				return ret;
		}
	}
	
	av_log(NULL, AV_LOG_DEBUG, "flushing buffer...\n");
	
	// more flushing
	for (j = 0; j < pr->n_stream_ids; j++)
		flush_packet_buffer(pr, &sbuffer[j], 1);
	
	// conclude writing
	av_write_trailer(pr->out_fctx);
	
	/*
	 * cleanup
	 */
	
	av_bitstream_filter_close(pr->bsf_h264_to_annexb);
	av_bitstream_filter_close(pr->bsf_dump_extra);
	
	for (j = 0; j < pr->n_stream_ids; j++) {
		av_freep(&sbuffer[j].pkts);
		av_freep(&sbuffer[j].frames);
		
		if (pr->out_fctx->streams[j]->codec && avcodec_is_open(pr->out_fctx->streams[j]->codec))
			avcodec_close(pr->out_fctx->streams[j]->codec);
	}
	
	for (i = 0; i < pr->in_fctx->nb_streams; i++) {
		if (pr->in_fctx->streams[i]->codec) {
			av_freep(&pr->in_fctx->streams[i]->codec->opaque);
			if (avcodec_is_open(pr->in_fctx->streams[i]->codec))
				avcodec_close(pr->in_fctx->streams[i]->codec);
		}
	}
	
	avformat_close_input(&pr->in_fctx);
	if (!(pr->out_fctx->oformat->flags & AVFMT_NOFILE))
		avio_closep(&pr->out_fctx->pb);
	avformat_free_context(pr->out_fctx);
	
	av_log(NULL, AV_LOG_INFO, "Video packets read: %zu\n", pr->video_packets_read);
	av_log(NULL, AV_LOG_INFO, "Video packets decoded: %zu\n", pr->video_packets_decoded);
	av_log(NULL, AV_LOG_INFO, "Video frames encoded: %zu\n", pr->video_frames_encoded);
	av_log(NULL, AV_LOG_INFO, "Video packets written: %zu\n", pr->video_packets_written);
	av_log(NULL, AV_LOG_INFO, "Other packets read: %zu\n", pr->other_packets_read);
	av_log(NULL, AV_LOG_INFO, "Other packets written: %zu\n", pr->other_packets_written);
	
	if (pr->n_cuts > 0) {
		struct stat st;
		size_t size, outputf_len;
		FILE *check_script = 0;
		
		stat(inputf, &st);
		size = st.st_size;
		stat(outputf, &st);
		av_log(NULL, AV_LOG_INFO, "\nFile size reduction: %f MB\n", (size - (double) st.st_size) / (1000*1000) );
		
		// print some info to check the cutpoints of the resulting video
		av_log(NULL, AV_LOG_INFO, "\ncutting points in \"%s\" at: ", outputf);
		double removed = 0;
		for (i=0;i<pr->n_cuts;i+=2) {
			double c = pr->cuts[i]-removed;
			av_log(NULL, AV_LOG_INFO, "%fs (%um %2us) ", c, (unsigned int)c/60, (unsigned int)c % 60);
			
			removed += pr->cuts[i+1] - pr->cuts[i];
		}
		av_log(NULL, AV_LOG_INFO, "\n");
		
		printf("\nYou can check the cutting points with:\nmpv \"edl://");
		
		if (getenv("AVCUT_CHECK_SCRIPT") && atoi(getenv("AVCUT_CHECK_SCRIPT"))) {
			check_script = fopen("avcut_check_cutpoints.sh", "a");
			fprintf(check_script, "mpv \"edl://");
		}
		
		outputf_len = strlen(outputf);
		removed = 0;
		for (i=0;i<pr->n_cuts;i+=2) {
			double c = pr->cuts[i]-removed;
			
			printf("%%%zu%%%s,%f,%f;", outputf_len, outputf, (c>=10 ? c-10 : 0 ), (c>=10 ? 20 : c + 10));
			
			if (check_script)
				fprintf(check_script, "%%%zu%%%s,%f,%f;", outputf_len, outputf, (c>=10 ? c-10 : 0 ), (c>=10 ? 20 : c + 10));
			
			removed += pr->cuts[i+1] - pr->cuts[i];
		}
		if (check_script)
			fprintf(check_script, "\"\n\n");
		
		printf("\"\n");
	}
	
	av_freep(&pr->cuts);
	av_freep(&sbuffer);
	
	return 0;
}