forked from colin121/x264-dsp
-
Notifications
You must be signed in to change notification settings - Fork 0
/
input.c
239 lines (214 loc) · 6.24 KB
/
input.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
/*****************************************************************************
* input.c: encoder input modules
*****************************************************************************/
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <stdint.h>
#include <limits.h>
#include "config.h"
#include "common/x264.h"
#include "input.h"
#include "downsample.h"
#ifdef BIN2C
/* With BIN2C defined, frames come from an in-memory array instead of a file:
 * open_file() skips fopen() and sizes the input from yuv_len, and
 * read_frame_internal() reads through p_yuv.
 * `yuv` and `yuv_len` are presumably provided by yuv.h -- TODO confirm. */
#include "yuv.h"
/* Read cursor into `yuv`; read_frame_internal() advances it after each plane. */
static char *p_yuv = (char *)yuv;
#endif
typedef struct
{
const char *name;
int planes;
float width[4];
float height[4];
int mod_width;
int mod_height;
} x264_cli_csp_t;
/* Colorspace table, indexed by X264_CSP_* value through designated
 * initializers. Each row lists, in order: name, plane count, per-plane width
 * factors, per-plane height factors, mod_width, mod_height.
 * Factor entries that are not listed are zero-initialized.
 * The bgr/bgra/rgb rows describe a single plane with a width factor of 3 or 4. */
static const x264_cli_csp_t x264_cli_csps[] = {
[X264_CSP_I420] = {"i420", 3, {1, .5, .5}, {1, .5, .5}, 2, 2},
[X264_CSP_I422] = {"i422", 3, {1, .5, .5}, {1, 1, 1}, 2, 1},
[X264_CSP_I444] = {"i444", 3, {1, 1, 1}, {1, 1, 1}, 1, 1},
[X264_CSP_YV12] = {"yv12", 3, {1, .5, .5}, {1, .5, .5}, 2, 2},
[X264_CSP_YV16] = {"yv16", 3, {1, .5, .5}, {1, 1, 1}, 2, 1},
[X264_CSP_YV24] = {"yv24", 3, {1, 1, 1}, {1, 1, 1}, 1, 1},
[X264_CSP_NV12] = {"nv12", 2, {1, 1}, {1, .5}, 2, 2},
[X264_CSP_NV16] = {"nv16", 2, {1, 1}, {1, 1}, 2, 1},
[X264_CSP_BGR] = {"bgr", 1, {3}, {1}, 1, 1},
[X264_CSP_BGRA] = {"bgra", 1, {4}, {1}, 1, 1},
[X264_CSP_RGB] = {"rgb", 1, {3}, {1}, 1, 1},
};
/* Returns 1 when the colorspace id in csp (flag bits masked off with
 * X264_CSP_MASK) is not strictly between X264_CSP_NONE and X264_CSP_MAX,
 * and 0 otherwise. */
static int x264_cli_csp_is_invalid(int csp) {
    const int id = csp & X264_CSP_MASK;

    if (id <= X264_CSP_NONE)
        return 1;
    return id >= X264_CSP_MAX;
}
/* Returns the per-component size factor for csp: 2 when the
 * X264_CSP_HIGH_DEPTH flag is set, 1 when it is not, and 0 when the
 * colorspace id itself is invalid. */
static int x264_cli_csp_depth_factor(int csp) {
    int factor = 0;

    if (!x264_cli_csp_is_invalid(csp)) {
        /* the csp has a depth of 8 or 16 bits per pixel component */
        if (csp & X264_CSP_HIGH_DEPTH)
            factor = 2;
        else
            factor = 1;
    }
    return factor;
}
static uint64_t x264_cli_pic_plane_size(int csp, int width, int height, int plane) {
uint64_t size = (uint64_t)width * height;
int csp_mask = csp & X264_CSP_MASK;
if (x264_cli_csp_is_invalid(csp) || plane < 0 || plane >= x264_cli_csps[csp_mask].planes)
return 0;
size *= x264_cli_csps[csp_mask].width[plane] * x264_cli_csps[csp_mask].height[plane];
size *= x264_cli_csp_depth_factor(csp);
return size;
}
/* Resets *pic and allocates one buffer per plane for a width x height
 * picture in colorspace csp.
 *
 * An invalid csp yields a picture with zero planes and still returns 0.
 * Returns -1 as soon as one plane allocation fails; planes allocated before
 * the failure stay referenced from pic->img.plane[]. */
static int x264_cli_pic_alloc(cli_pic_t *pic, int csp, int width, int height) {
    const int id = csp & X264_CSP_MASK;
    int n;

    memset(pic, 0, sizeof *pic);
    pic->img.planes = x264_cli_csp_is_invalid(csp) ? 0 : x264_cli_csps[id].planes;
    pic->img.csp = csp;
    pic->img.width = width;
    pic->img.height = height;

    n = 0;
    while (n < pic->img.planes) {
        pic->img.plane[n] = malloc(x264_cli_pic_plane_size(csp, width, height, n));
        if (pic->img.plane[n] == NULL)
            return -1;
        /* stride = picture width scaled by the plane's width factor and the depth factor */
        pic->img.stride[n] = width * x264_cli_csps[id].width[n] * x264_cli_csp_depth_factor(csp);
        n++;
    }
    return 0;
}
/* Frees every plane buffer referenced by *pic and then zeroes the whole
 * structure. */
static void x264_cli_pic_clean(cli_pic_t *pic) {
    int n = 0;

    while (n < pic->img.planes) {
        free(pic->img.plane[n]);
        n++;
    }
    memset(pic, 0, sizeof *pic);
}
/* Looks up the x264_cli_csps[] entry for csp (flag bits ignored).
 * Returns NULL when the colorspace id is invalid. */
static const x264_cli_csp_t *x264_cli_get_csp(int csp) {
    return x264_cli_csp_is_invalid(csp) ? NULL : &x264_cli_csps[csp & X264_CSP_MASK];
}
/* Per-input state created by open_file() and handed back to the other
 * callbacks as an opaque handle. */
typedef struct
{
FILE *fh; /* input file handle; never opened when BIN2C is defined */
int next_frame; /* number of the frame the next sequential read will return */
uint64_t plane_size[4]; /* plane size in pixels (byte size divided by the depth factor) */
uint64_t frame_size; /* frame size in bytes: sum of all plane byte sizes */
} input_hnd_t;
/*
 * Opens a raw YUV input and describes it in *info.
 *
 * The picture size is taken from the first "<width>x<height>" pattern found
 * in psz_filename. If no complete pattern is found, info->width and
 * info->height keep whatever the caller stored there. With DOWNSAMPLE
 * defined both dimensions are divided by SCALE. The colorspace is always set
 * to X264_CSP_I420.
 *
 * psz_filename "-" selects stdin; with BIN2C defined no file is opened.
 *
 * Returns 0 on success, with *p_handle pointing at a newly allocated
 * input_hnd_t. Returns -1 on failure; in that case the handle has been freed
 * and *p_handle is left untouched.
 */
static int open_file(char *psz_filename, void **p_handle, video_info_t *info) {
    int i;
    int parsed_width, parsed_height;
    char *p;
    const x264_cli_csp_t *csp;
    input_hnd_t *h = calloc(1, sizeof(*h));
    if (!h)
        return -1;
    /* try to parse the file name to retrieve width and height; parse into
     * locals so that a partial match (e.g. a lone number) cannot clobber
     * info->width */
    for (p = psz_filename; *p; p++) {
        if (*p >= '0' && *p <= '9' && sscanf(p, "%dx%d", &parsed_width, &parsed_height) == 2) {
            info->width = parsed_width;
            info->height = parsed_height;
            break;
        }
    }
#ifdef DOWNSAMPLE
    info->height /= SCALE;
    info->width /= SCALE;
#endif
    /* zero or negative dimensions can never describe a picture */
    if (info->width <= 0 || info->height <= 0)
        goto fail;
    /* default color-space: I420 without high bit-depth */
    info->csp = X264_CSP_I420;
    info->num_frames = 0;
#ifndef BIN2C
    if (!strcmp(psz_filename, "-"))
        h->fh = stdin;
    else
        h->fh = fopen(psz_filename, "rb");
    if (h->fh == NULL)
        goto fail;
#endif
    csp = x264_cli_get_csp(info->csp);
    for (i = 0; i < csp->planes; i++) {
        h->plane_size[i] = x264_cli_pic_plane_size(info->csp, info->width, info->height, i);
        h->frame_size += h->plane_size[i];
        /* x264_cli_pic_plane_size returns the size in bytes, we need the value in pixels from here on */
        h->plane_size[i] /= x264_cli_csp_depth_factor(info->csp);
    }
    if (h->frame_size > 0) {
#ifndef BIN2C
        /* NOTE(review): on a non-seekable stream (e.g. piped stdin) ftell()
         * fails and the frame count below is meaningless -- confirm how
         * callers use num_frames before changing this. */
        uint64_t i_size;
        fseek(h->fh, 0, SEEK_END);
        i_size = ftell(h->fh);
        fseek(h->fh, 0, SEEK_SET);
        info->num_frames = i_size / h->frame_size;
#else
        info->num_frames = yuv_len / h->frame_size;
#endif
#ifdef DOWNSAMPLE
        /* frame_size describes the downsampled picture; each source frame
         * is SCALE*SCALE times larger */
        info->num_frames /= SCALE * SCALE;
#endif
    }
    *p_handle = h;
    return 0;

fail:
    /* no file is open on any path that reaches here, so only the handle
     * itself needs releasing */
    free(h);
    return -1;
}
/*
 * Reads the next frame from the input into pic, one plane at a time.
 *
 * Without DOWNSAMPLE each plane is copied verbatim. With DOWNSAMPLE the
 * source plane is SCALE*SCALE times larger than the destination and is
 * reduced by resize2()/resize4()/resize().
 * With BIN2C defined the data comes from the in-memory p_yuv cursor instead
 * of h->fh, and no failure is detected.
 *
 * Returns 0 on success and 1 on failure (allocation failure or short read).
 * On failure the planes of pic processed so far keep their new contents and
 * the remaining planes are left untouched.
 */
static int read_frame_internal(cli_pic_t *pic, input_hnd_t *h) {
    int i;
    int pixel_depth = x264_cli_csp_depth_factor(pic->img.csp);
    size_t plane_size, plane_bytes, height, width;
    void *buf;
    for (i = 0; i < pic->img.planes; i++) {
        plane_size = h->plane_size[i];
        height = pic->img.height;
        width = pic->img.width;
#ifdef DOWNSAMPLE
        // only for YUV420
        if (i > 0) {
            height /= 2;
            width /= 2;
        }
        plane_size *= SCALE * SCALE;
#endif
        /* plane_size counts pixels; every byte-sized operation needs the depth factor */
        plane_bytes = pixel_depth * plane_size;
#ifndef BIN2C
        /* never request 0 bytes: malloc(0) may legitimately return NULL */
        buf = malloc(plane_bytes ? plane_bytes : 1);
        if (!buf)
            return 1;
        if (fread(buf, pixel_depth, plane_size, h->fh) != plane_size) {
            /* short read: do not copy partially filled data into pic */
            free(buf);
            return 1;
        }
#else
        buf = (void *)p_yuv;
#endif
#ifndef DOWNSAMPLE
        memcpy((void *)pic->img.plane[i], buf, plane_bytes);
#elif DOWNSAMPLE == DOWNSAMPLE_BILINEAR
#if SCALE == 2
        resize2((void *)pic->img.plane[i], buf, width, height);
#elif SCALE == 4
        resize4((void *)pic->img.plane[i], buf, width, height);
#else
#error wrong SCALE for bilinear!
#endif
#elif DOWNSAMPLE == DOWNSAMPLE_BICUBIC
        resize((void *)pic->img.plane[i], buf, width, height);
#else
#error wrong DOWNSAMPLE!
#endif
#ifndef BIN2C
        free(buf);
#else
        p_yuv += plane_bytes;
#endif
    }
    return 0;
}
/*
 * Reads frame number i_frame into pic.
 *
 * When i_frame lies ahead of the next sequential frame, the input is
 * advanced first: by fseek() when that works, otherwise (non-seekable
 * stream, or offset not representable as long) by reading and discarding
 * the frames in between. Requests at or behind the current position read
 * the next sequential frame without repositioning.
 * With BIN2C defined no skipping is performed.
 *
 * Returns 0 on success, -1 when a frame could not be read.
 */
static int read_frame(cli_pic_t *pic, void *handle, int i_frame) {
    input_hnd_t *h = handle;
#ifndef BIN2C
    if (i_frame > h->next_frame) {
        uint64_t offset = (uint64_t)i_frame * h->frame_size;
#ifdef DOWNSAMPLE
        /* frame_size describes the downsampled picture; frames in the file
         * are SCALE*SCALE times larger (see read_frame_internal) */
        offset *= SCALE * SCALE;
#endif
        if (offset > (uint64_t)LONG_MAX || fseek(h->fh, (long)offset, SEEK_SET) != 0) {
            /* cannot seek: consume the skipped frames sequentially */
            while (i_frame > h->next_frame) {
                if (read_frame_internal(pic, h))
                    return -1;
                h->next_frame++;
            }
        }
    }
#endif
    if (read_frame_internal(pic, h))
        return -1;
    h->next_frame = i_frame + 1;
    return 0;
}
/*
 * Releases an input handle created by open_file().
 *
 * Closes the underlying file when one is open and always frees the handle
 * itself, including in BIN2C builds where no file is ever opened.
 * A NULL handle is accepted and ignored. Always returns 0.
 */
static int close_file(void *handle) {
    input_hnd_t *h = handle;
    if (!h)
        return 0;
#ifndef BIN2C
    if (h->fh)
        fclose(h->fh);
#endif
    free(h);
    return 0;
}
/* Input module descriptor exported from this file. The initializers are
 * positional, so the meaning of each slot is fixed by the cli_input_t
 * declaration (presumably in input.h -- not visible here). The fourth slot
 * is deliberately left NULL. */
const cli_input_t cli_input = {open_file, x264_cli_pic_alloc, read_frame, NULL, x264_cli_pic_clean, close_file};