input_curl: buffered rewinding
During codec detection, the beginning of the stream is consumed. This is a common operation, which takes a lot of time when handling remote resources. To optimize this, remember the first 64 kB of a stream. This way, we can rewind the stream without actually fetching the start of the stream again.
This commit is contained in:
parent
020c04e702
commit
460b15d29c
116
src/input_curl.c
116
src/input_curl.c
@ -29,6 +29,9 @@
|
||||
#include <curl/curl.h>
|
||||
#include <glib.h>
|
||||
|
||||
/** rewinding is possible after up to 64 kB */
|
||||
static const off_t max_rewind_size = 64 * 1024;
|
||||
|
||||
/**
|
||||
* Buffers created by input_curl_writefunction().
|
||||
*/
|
||||
@ -64,6 +67,9 @@ struct input_curl {
|
||||
|
||||
/** did libcurl tell us the we're at the end of the response body? */
|
||||
bool eof;
|
||||
|
||||
/** limited list of old buffers, for rewinding */
|
||||
struct list_head rewind;
|
||||
};
|
||||
|
||||
/** libcurl should accept "ICY 200 OK" */
|
||||
@ -111,6 +117,13 @@ input_curl_easy_free(struct input_curl *c)
|
||||
|
||||
g_free(buffer);
|
||||
}
|
||||
|
||||
while (!list_empty(&c->rewind)) {
|
||||
struct buffer *buffer = (struct buffer *)c->rewind.next;
|
||||
list_del(&buffer->siblings);
|
||||
|
||||
g_free(buffer);
|
||||
}
|
||||
}
|
||||
|
||||
/**
|
||||
@ -169,7 +182,8 @@ input_curl_select(struct input_curl *c)
|
||||
}
|
||||
|
||||
static size_t
|
||||
read_from_buffer(struct buffer *buffer, void *dest, size_t length)
|
||||
read_from_buffer(struct buffer *buffer, void *dest, size_t length,
|
||||
struct list_head *rewind_head)
|
||||
{
|
||||
assert(buffer->size > 0);
|
||||
assert(buffer->consumed < buffer->size);
|
||||
@ -182,6 +196,11 @@ read_from_buffer(struct buffer *buffer, void *dest, size_t length)
|
||||
buffer->consumed += length;
|
||||
if (buffer->consumed == buffer->size) {
|
||||
list_del(&buffer->siblings);
|
||||
|
||||
if (rewind_head != NULL)
|
||||
/* append this buffer to the rewind buffer list */
|
||||
list_add_tail(&buffer->siblings, rewind_head);
|
||||
else
|
||||
g_free(buffer);
|
||||
}
|
||||
|
||||
@ -193,6 +212,7 @@ input_curl_read(struct input_stream *is, void *ptr, size_t size)
|
||||
{
|
||||
struct input_curl *c = is->data;
|
||||
CURLMcode mcode = CURLM_CALL_MULTI_PERFORM;
|
||||
struct list_head *rewind_head;
|
||||
size_t nbytes = 0;
|
||||
char *dest = ptr;
|
||||
|
||||
@ -223,15 +243,37 @@ input_curl_read(struct input_stream *is, void *ptr, size_t size)
|
||||
|
||||
/* send buffer contents */
|
||||
|
||||
if (!list_empty(&c->rewind) || is->offset == 0)
|
||||
/* at the beginning or already writing the rewind
|
||||
buffer list */
|
||||
rewind_head = &c->rewind;
|
||||
else
|
||||
/* we don't need the rewind buffers anymore */
|
||||
rewind_head = NULL;
|
||||
|
||||
while (size > 0 && !list_empty(&c->buffers)) {
|
||||
struct buffer *buffer = (struct buffer *)c->buffers.next;
|
||||
size_t copy = read_from_buffer(buffer, dest + nbytes, size);
|
||||
size_t copy = read_from_buffer(buffer, dest + nbytes, size,
|
||||
rewind_head);
|
||||
|
||||
nbytes += copy;
|
||||
size -= copy;
|
||||
}
|
||||
|
||||
is->offset += (off_t)nbytes;
|
||||
|
||||
if (rewind_head != NULL && is->offset > max_rewind_size) {
|
||||
/* drop the rewind buffer, it has grown too large */
|
||||
|
||||
while (!list_empty(&c->rewind)) {
|
||||
struct buffer *buffer =
|
||||
(struct buffer *)c->rewind.next;
|
||||
list_del(&buffer->siblings);
|
||||
|
||||
g_free(buffer);
|
||||
}
|
||||
}
|
||||
|
||||
return nbytes;
|
||||
}
|
||||
|
||||
@ -413,12 +455,81 @@ input_curl_send_request(struct input_curl *c)
|
||||
return true;
|
||||
}
|
||||
|
||||
static bool
|
||||
input_curl_can_rewind(struct input_stream *is)
|
||||
{
|
||||
struct input_curl *c = is->data;
|
||||
struct buffer *buffer;
|
||||
|
||||
if (!list_empty(&c->rewind))
|
||||
/* the rewind buffer hasn't been wiped yet */
|
||||
return true;
|
||||
|
||||
if (list_empty(&c->buffers))
|
||||
/* there are no buffers at all - cheap rewind not
|
||||
possible */
|
||||
return false;
|
||||
|
||||
/* rewind is possible if this is the very first buffer of the
|
||||
resource */
|
||||
buffer = (struct buffer*)c->buffers.next;
|
||||
return (off_t)buffer->consumed == is->offset;
|
||||
}
|
||||
|
||||
static void
|
||||
input_curl_rewind(struct input_stream *is)
|
||||
{
|
||||
struct input_curl *c = is->data;
|
||||
struct buffer *buffer;
|
||||
#ifndef NDEBUG
|
||||
off_t offset = 0;
|
||||
#endif
|
||||
|
||||
/* reset all rewind buffers */
|
||||
|
||||
list_for_each_entry(buffer, &c->rewind, siblings) {
|
||||
#ifndef NDEBUG
|
||||
offset += buffer->consumed;
|
||||
#endif
|
||||
buffer->consumed = 0;
|
||||
}
|
||||
|
||||
/* rewind the current buffer */
|
||||
|
||||
if (!list_empty(&c->buffers)) {
|
||||
buffer = (struct buffer*)c->buffers.next;
|
||||
#ifndef NDEBUG
|
||||
offset += buffer->consumed;
|
||||
#endif
|
||||
buffer->consumed = 0;
|
||||
}
|
||||
|
||||
assert(offset == is->offset);
|
||||
|
||||
/* move all rewind buffers back to the regular buffer list */
|
||||
|
||||
list_splice_init(&c->rewind, &c->buffers);
|
||||
is->offset = 0;
|
||||
}
|
||||
|
||||
static bool
|
||||
input_curl_seek(struct input_stream *is, off_t offset, int whence)
|
||||
{
|
||||
struct input_curl *c = is->data;
|
||||
bool ret;
|
||||
|
||||
if (whence == SEEK_SET && offset == 0) {
|
||||
if (is->offset == 0)
|
||||
/* no-op */
|
||||
return true;
|
||||
|
||||
if (input_curl_can_rewind(is)) {
|
||||
/* we have enough rewind buffers left */
|
||||
input_curl_rewind(is);
|
||||
return true;
|
||||
}
|
||||
}
|
||||
|
||||
if (!is->seekable)
|
||||
return false;
|
||||
|
||||
@ -478,6 +589,7 @@ input_curl_open(struct input_stream *is, const char *url)
|
||||
c = g_new0(struct input_curl, 1);
|
||||
c->url = g_strdup(url);
|
||||
INIT_LIST_HEAD(&c->buffers);
|
||||
INIT_LIST_HEAD(&c->rewind);
|
||||
|
||||
is->data = c;
|
||||
|
||||
|
Loading…
Reference in New Issue
Block a user