aboutsummaryrefslogblamecommitdiffstats
path: root/mail/e-http-request.c
blob: ba8b1f5a13f8a3e2ba48f904ff75c30ffe585a09 (plain) (tree)



























                                                                             
                                  





















                                                               

                    


























































                                                                                     
                                















                                                                            
                                        






                                                                                              
                                              
                                        






                                                                                      
                                              
                                        









                                                                                    
                                        




































                                                                                           








                                            















































































































                                                                                               
                          












                                                                                     
                                          






















                                                                                          


                                                                      




                                                                                 






                                                                                  











































































































































































                                                                                            
/*
 * e-http-request.c
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) version 3.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with the program; if not, see <http://www.gnu.org/licenses/>
 *
 */

#include "e-http-request.h"

#define LIBSOUP_USE_UNSTABLE_REQUEST_API
#include <libsoup/soup.h>
#include <libsoup/soup-requester.h>
#include <libsoup/soup-request-http.h>
#include <camel/camel.h>
#include <webkit/webkit.h>

#include <e-util/e-util.h>
#include <libedataserver/e-flag.h>

#include <string.h>

#include "em-format-html.h"


#define d(x)

#define E_HTTP_REQUEST_GET_PRIVATE(obj) \
    (G_TYPE_INSTANCE_GET_PRIVATE \
    ((obj), E_TYPE_HTTP_REQUEST, EHTTPRequestPrivate))

struct _EHTTPRequestPrivate {
    gchar *content_type;
    gint content_length;

    EMFormatHTML *efh;
};

G_DEFINE_TYPE (EHTTPRequest, e_http_request, SOUP_TYPE_REQUEST)

struct http_request_async_data {
    EFlag *flag;

    GMainLoop *loop;
    GCancellable *cancellable;
    CamelDataCache *cache;
    gchar *cache_key;

    CamelStream *cache_stream;
    gchar *content_type;
    goffset content_length;

    gchar *buff;
};

static void
http_request_write_to_cache (GInputStream *stream,
                             GAsyncResult *res,
                             struct http_request_async_data *data)
{
    GError *error;
    gssize len;

    error = NULL;
    len = g_input_stream_read_finish (stream, res, &error);

    /* Error while reading data */
    if (len == -1) {
        if (!g_error_matches (error, G_IO_ERROR, G_IO_ERROR_CANCELLED)) {
            g_message ("Error while reading input stream: %s",
                error ? error->message : "Unknown error");
            g_clear_error (&error);
        }

        /* Don't keep broken data in cache */
        camel_data_cache_remove (data->cache, "http", data->cache_key, NULL);

        goto cleanup;
    }

    /* EOF */
    if (len == 0) {
        goto cleanup;
    }

    /* Write chunk to cache and read another block of data. */
    camel_stream_write (data->cache_stream, data->buff, len,
        data->cancellable, NULL);

    g_input_stream_read_async (stream, data->buff, 4096,
        G_PRIORITY_DEFAULT, data->cancellable,
        (GAsyncReadyCallback) http_request_write_to_cache, data);

    return;

 cleanup:
    if (data->buff)
        g_free (data->buff);

    g_object_unref (stream);

    g_main_loop_quit (data->loop);
    e_flag_set (data->flag);
}

static void
http_request_finished (SoupRequest *request,
                       GAsyncResult *res,
                       struct http_request_async_data *data)
{
    GError *error;
    SoupMessage *message;
    GInputStream *stream;

    error = NULL;
    stream = soup_request_send_finish (request, res, &error);
    /* If there is an error or the operation was canceled, do nothing */
    if (error) {
        g_main_loop_quit (data->loop);
        e_flag_set (data->flag);
        g_error_free (error);
        return;
    }

    if (!stream) {
        g_warning("HTTP request failed: %s", error ? error->message: "Unknown error");
        g_clear_error (&error);
        g_main_loop_quit (data->loop);
        e_flag_set (data->flag);
        return;
    }

    message = soup_request_http_get_message (SOUP_REQUEST_HTTP (request));
    if (!SOUP_STATUS_IS_SUCCESSFUL (message->status_code)) {
        g_warning ("HTTP request failed: HTTP code %d", message->status_code);
        g_object_unref (message);
        g_main_loop_quit (data->loop);
        e_flag_set (data->flag);
        return;
    }

    g_object_unref (message);

    data->content_length = soup_request_get_content_length (request);
    data->content_type = g_strdup (soup_request_get_content_type (request));

    if (!data->cache_stream || g_cancellable_is_cancelled (data->cancellable)) {
        g_main_loop_quit (data->loop);
        e_flag_set (data->flag);
        return;
    }

    data->buff = g_malloc (4096);
    g_input_stream_read_async (stream, data->buff, 4096,
        G_PRIORITY_DEFAULT, data->cancellable,
        (GAsyncReadyCallback) http_request_write_to_cache, data);
}

static gssize
copy_stream_to_stream (CamelStream *input,
               GMemoryInputStream *output,
               GCancellable *cancellable)
{
    gchar *buff;
    gssize read_len = 0;
    gssize total_len = 0;

    g_seekable_seek (G_SEEKABLE (input), 0, G_SEEK_SET, cancellable, NULL);

    buff = g_malloc (4096);
    while ((read_len = camel_stream_read (input, buff, 4096, cancellable, NULL)) > 0) {

        g_memory_input_stream_add_data (output, buff, read_len, g_free);

        total_len += read_len;

        buff = g_malloc (4096);
    }

    /* Free the last unused buffer */
    g_free (buff);

    return total_len;
}

static void
quit_main_loop (GCancellable *cancellable,
            GMainLoop *loop)
{
    if (g_main_loop_is_running (loop)) {
        g_main_loop_quit (loop);
    }
}

static void
handle_http_request (GSimpleAsyncResult *res,
                     GObject *object,
                     GCancellable *cancellable)
{
    EHTTPRequest *request = E_HTTP_REQUEST (object);
    SoupURI *soup_uri;
    gchar *evo_uri, *uri;
    GInputStream *stream;
    gboolean force_load_images = FALSE;
    gchar *uri_md5;

    const gchar *user_cache_dir;
    CamelDataCache *cache;
    CamelStream *cache_stream;

    GHashTable *query;

    if (g_cancellable_is_cancelled (cancellable)) {
        return;
    }

    /* Remove the __evo-mail query */
    soup_uri = soup_request_get_uri (SOUP_REQUEST (request));
    query = soup_form_decode (soup_uri->query);
    g_hash_table_remove (query, "__evo-mail");

    /* Remove __evo-load-images if present (and in such case set
     * force_load_images to TRUE) */
    force_load_images = g_hash_table_remove (query, "__evo-load-images");

    soup_uri_set_query_from_form (soup_uri, query);
    g_hash_table_unref (query);

    evo_uri = soup_uri_to_string (soup_uri, FALSE);

    /* Remove the "evo-" prefix from scheme */
    if (evo_uri && (strlen (evo_uri) > 5)) {
        uri = g_strdup (&evo_uri[4]);
        g_free (evo_uri);
    }

    g_return_if_fail (uri && *uri);

    /* Use MD5 hash of the URI as a filname of the resourec cache file.
     * We were previously using the URI as a filename but the URI is
     * sometimes too long for a filename. */
    uri_md5 = g_compute_checksum_for_string (G_CHECKSUM_MD5, uri, -1);

    /* Open Evolution's cache */
    user_cache_dir = e_get_user_cache_dir ();
    cache = camel_data_cache_new (user_cache_dir, NULL);
    if (cache) {
        camel_data_cache_set_expire_age (cache, 24 * 60 * 60);
        camel_data_cache_set_expire_access (cache, 2 * 60 * 60);
    }

    /* Found item in cache! */
    cache_stream = camel_data_cache_get (cache, "http", uri_md5, NULL);
    if (cache_stream) {

        gssize len;

        stream = g_memory_input_stream_new ();

        len = copy_stream_to_stream (cache_stream,
                   G_MEMORY_INPUT_STREAM (stream), cancellable);
        request->priv->content_length = len;

        g_object_unref (cache_stream);

        /* When succesfully read some data from cache then
         * get mimetype and return the stream to WebKit.
         * Otherwise try to fetch the resource again from the network. */
        if ((len != -1) && (request->priv->content_length > 0)) {
            GFile *file;
            GFileInfo *info;
            gchar *path;

            path = camel_data_cache_get_filename (cache, "http", uri_md5, NULL);
            file = g_file_new_for_path (path);
            info = g_file_query_info (file, G_FILE_ATTRIBUTE_STANDARD_CONTENT_TYPE,
                    0, cancellable, NULL);

            request->priv->content_type = g_strdup (
                g_file_info_get_content_type (info));

            d(printf ("'%s' found in cache (%d bytes, %s)\n",
                uri, request->priv->content_length,
                request->priv->content_type));

            g_object_unref (info);
            g_object_unref (file);
            g_free (path);

            /* Set result and quit the thread */
            g_simple_async_result_set_op_res_gpointer (res, stream, NULL);

            goto cleanup;
        } else {
            d(printf("Failed to load '%s' from cache.\n", uri));
        }
    }

    /* Item not found in cache, but image loading policy allows us to fetch
     * it from the interwebs */
    if (force_load_images || em_format_html_can_load_images (request->priv->efh)) {

        SoupRequester *requester;
        SoupRequest *http_request;
        SoupSession *session;
        GMainContext *context;
        GError *error;
        gulong id;

        struct http_request_async_data data = { 0 };

        context = g_main_context_get_thread_default ();
        session = soup_session_async_new_with_options (
                    SOUP_SESSION_ASYNC_CONTEXT, context, NULL);

        requester = soup_requester_new ();
        soup_session_add_feature (session, SOUP_SESSION_FEATURE (requester));

        http_request = soup_requester_request (requester, uri, NULL);

        error = NULL;
        data.flag = e_flag_new ();
        data.loop = g_main_loop_new (context, TRUE);
        data.cancellable = cancellable;
        data.cache = cache;
        data.cache_key = uri_md5;
        data.cache_stream = camel_data_cache_add (cache, "http", uri_md5, &error);

        if (!data.cache_stream) {
            g_warning ("Failed to create cache file for '%s': %s",
                uri, error ? error->message : "Unknown error");
            g_clear_error (&error);

            /* We rely on existence of the stream. If CamelDataCache
             * failed to create a cache file, then store it at least
             * temporarily. */
            data.cache_stream = camel_stream_mem_new ();
        }

        /* Send the request and waint in mainloop until it's finished
         * and copied to cache */
        d(printf(" '%s' not in cache, sending HTTP request\n", uri));
        soup_request_send_async (http_request, cancellable,
            (GAsyncReadyCallback) http_request_finished, &data);

        id = g_cancellable_connect (cancellable,
            G_CALLBACK (quit_main_loop), data.loop, NULL);

        /* Wait for the asynchronous HTTP GET to finish */
        g_main_loop_run (data.loop);
        d(printf (" '%s' fetched from internet and (hopefully) stored in"
              " cache\n", uri));

        g_cancellable_disconnect (cancellable, id);

        /* Wait until all asynchronous operations are finished working
           with the 'data' structure so that it's not free'd too early. */
        e_flag_wait (data.flag);
        e_flag_free (data.flag);

        g_main_loop_unref (data.loop);

        g_object_unref (session);
        g_object_unref (http_request);
        g_object_unref (requester);

        /* Copy the content of cache stream to GInputStream that can be
         * returned to WebKit */
        stream = g_memory_input_stream_new ();
        copy_stream_to_stream (data.cache_stream,
            G_MEMORY_INPUT_STREAM (stream), cancellable);

        camel_stream_close (data.cache_stream, cancellable, NULL);
        g_object_unref (data.cache_stream);

        request->priv->content_length = data.content_length;
        request->priv->content_type = data.content_type;

        g_simple_async_result_set_op_res_gpointer (res, stream, NULL);

        goto cleanup;

    }

 cleanup:
    g_free (uri);
    g_free (uri_md5);
}

static void
http_request_finalize (GObject *object)
{
    EHTTPRequest *request = E_HTTP_REQUEST (object);

    if (request->priv->content_type) {
        g_free (request->priv->content_type);
        request->priv->content_type = NULL;
    }

    if (request->priv->efh) {
        g_object_unref (request->priv->efh);
        request->priv->efh = NULL;
    }

    G_OBJECT_CLASS (e_http_request_parent_class)->finalize (object);
}

static gboolean
http_request_check_uri (SoupRequest *request,
                       SoupURI *uri,
                       GError **error)
{
    return ((strcmp (uri->scheme, "evo-http") == 0) ||
        (strcmp (uri->scheme, "evo-https") == 0));
}

static void
http_request_send_async (SoupRequest *request,
                         GCancellable *cancellable,
                         GAsyncReadyCallback callback,
                         gpointer user_data)
{
    EHTTPRequest *ehr;
    GSimpleAsyncResult *result;
    gchar *mail_uri;
    SoupURI *uri;
    const gchar *enc;
    SoupSession *session;
    GHashTable *formatters, *query;

    ehr = E_HTTP_REQUEST (request);
    uri = soup_request_get_uri (request);
    query = soup_form_decode (uri->query);

    d(printf("received request for %s\n", soup_uri_to_string (uri, FALSE)));

    enc = g_hash_table_lookup (query, "__evo-mail");

    if (!enc || !*enc) {
        g_hash_table_destroy (query);
        return;
    }

    mail_uri = soup_uri_decode (enc);

    session = webkit_get_default_session ();
    formatters = g_object_get_data (G_OBJECT (session), "formatters");
    g_return_if_fail (formatters != NULL);

    ehr->priv->efh = g_hash_table_lookup (formatters, mail_uri);
    g_free (mail_uri);

    g_return_if_fail (ehr->priv->efh);

    /* Make sure the formatter lives until we are finished here */
    g_object_ref (ehr->priv->efh);

    result = g_simple_async_result_new (G_OBJECT (request), callback,
            user_data, http_request_send_async);
    g_simple_async_result_run_in_thread (result, handle_http_request,
            G_PRIORITY_DEFAULT, cancellable);

    g_hash_table_destroy (query);
}

static GInputStream *
http_request_send_finish (SoupRequest *request,
                          GAsyncResult *result,
                          GError **error)
{
    GInputStream *stream;

    stream = g_simple_async_result_get_op_res_gpointer (G_SIMPLE_ASYNC_RESULT (result));
    g_object_unref (result);

    /* Reset the stream before passing it back to webkit */
    if (stream && G_IS_SEEKABLE (stream))
        g_seekable_seek (G_SEEKABLE (stream), 0, G_SEEK_SET, NULL, NULL);

    if (!stream) /* We must always return something */
        stream = g_memory_input_stream_new ();

    return stream;
}

static goffset
http_request_get_content_length (SoupRequest *request)
{
    EHTTPRequest *efr = E_HTTP_REQUEST (request);

    d(printf("Content-Length: %d bytes\n", efr->priv->content_length));
    return efr->priv->content_length;
}

static const gchar *
http_request_get_content_type (SoupRequest *request)
{
    EHTTPRequest *efr = E_HTTP_REQUEST (request);

    d(printf("Content-Type: %s\n", efr->priv->content_type));

    return efr->priv->content_type;
}

static const gchar *data_schemes[] = { "evo-http", "evo-https", NULL };

static void
e_http_request_class_init (EHTTPRequestClass *class)
{
    GObjectClass *object_class;
    SoupRequestClass *request_class;

    g_type_class_add_private (class, sizeof (EHTTPRequestPrivate));

    object_class = G_OBJECT_CLASS (class);
    object_class->finalize = http_request_finalize;

    request_class = SOUP_REQUEST_CLASS (class);
    request_class->schemes = data_schemes;
    request_class->send_async = http_request_send_async;
    request_class->send_finish = http_request_send_finish;
    request_class->get_content_type = http_request_get_content_type;
    request_class->get_content_length = http_request_get_content_length;
    request_class->check_uri = http_request_check_uri;
}

static void
e_http_request_init (EHTTPRequest *request)
{
    request->priv = E_HTTP_REQUEST_GET_PRIVATE (request);
}