mirror of
https://git.pwmt.org/pwmt/zathura.git
synced 2024-11-10 23:13:48 +01:00
5021767a18
… and use it everywhere we want to get the content type of a file. Signed-off-by: Sebastian Ramacher <sebastian+dev@ramacher.at>
174 lines
4.0 KiB
C
174 lines
4.0 KiB
C
/* See LICENSE file for license and copyright information */
|
|
|
|
#define _BSD_SOURCE
|
|
#define _XOPEN_SOURCE 700
|
|
|
|
#include "content-type.h"
|
|
#include "macros.h"
|
|
|
|
#include <girara/utils.h>
|
|
#ifdef WITH_MAGIC
|
|
#include <magic.h>
|
|
#else
|
|
#include <sys/types.h>
|
|
#include <sys/wait.h>
|
|
#endif
|
|
#include <stdio.h>
|
|
#include <glib.h>
|
|
#include <gio/gio.h>
|
|
|
|
/** Read at most GT_MAX_READ bytes before falling back to file. */
|
|
static const size_t GT_MAX_READ = 1 << 16;
|
|
|
|
#ifdef WITH_MAGIC
|
|
static const char*
|
|
guess_type_magic(const char* path) {
|
|
const char* mime_type = NULL;
|
|
|
|
/* creat magic cookie */
|
|
const int flags =
|
|
MAGIC_MIME_TYPE |
|
|
MAGIC_SYMLINK |
|
|
MAGIC_NO_CHECK_APPTYPE |
|
|
MAGIC_NO_CHECK_CDF |
|
|
MAGIC_NO_CHECK_ELF |
|
|
MAGIC_NO_CHECK_ENCODING;
|
|
magic_t magic = magic_open(flags);
|
|
if (magic == NULL) {
|
|
girara_debug("failed creating the magic cookie");
|
|
goto cleanup;
|
|
}
|
|
|
|
/* ... and load mime database */
|
|
if (magic_load(magic, NULL) < 0) {
|
|
girara_debug("failed loading the magic database: %s", magic_error(magic));
|
|
goto cleanup;
|
|
}
|
|
|
|
/* get the mime type */
|
|
mime_type = magic_file(magic, path);
|
|
if (mime_type == NULL) {
|
|
girara_debug("failed guessing filetype: %s", magic_error(magic));
|
|
goto cleanup;
|
|
}
|
|
/* dup so we own the memory */
|
|
mime_type = g_strdup(mime_type);
|
|
|
|
girara_debug("magic detected filetype: %s", mime_type);
|
|
|
|
cleanup:
|
|
if (magic != NULL) {
|
|
magic_close(magic);
|
|
}
|
|
|
|
return mime_type;
|
|
}
|
|
|
|
/**
 * Stub used when WITH_MAGIC is defined: the external `file` program is not
 * consulted in this configuration.
 *
 * @param path Ignored
 * @return Always NULL
 */
static const char*
guess_type_file(const char* UNUSED(path)) {
  return NULL;
}
|
|
#else
|
|
/**
 * Stub used when WITH_MAGIC is not defined: no libmagic detection is
 * performed in this configuration.
 *
 * @param path Ignored
 * @return Always NULL
 */
static const char*
guess_type_magic(const char* UNUSED(path))
{
  return NULL;
}
|
|
|
|
static const char*
|
|
guess_type_file(const char* path)
|
|
{
|
|
GString* command = g_string_new("file -b --mime-type ");
|
|
char* tmp = g_shell_quote(path);
|
|
|
|
g_string_append(command, tmp);
|
|
g_free(tmp);
|
|
|
|
GError* error = NULL;
|
|
char* out = NULL;
|
|
int ret = 0;
|
|
g_spawn_command_line_sync(command->str, &out, NULL, &ret, &error);
|
|
g_string_free(command, TRUE);
|
|
if (error != NULL) {
|
|
girara_warning("failed to execute command: %s", error->message);
|
|
g_error_free(error);
|
|
g_free(out);
|
|
return NULL;
|
|
}
|
|
if (WEXITSTATUS(ret) != 0) {
|
|
girara_warning("file failed with error code: %d", WEXITSTATUS(ret));
|
|
g_free(out);
|
|
return NULL;
|
|
}
|
|
|
|
g_strdelimit(out, "\n\r", '\0');
|
|
return out;
|
|
}
|
|
#endif
|
|
|
|
static const char*
|
|
guess_type_glib(const char* path)
|
|
{
|
|
gboolean uncertain = FALSE;
|
|
const char* content_type = g_content_type_guess(path, NULL, 0, &uncertain);
|
|
if (content_type == NULL) {
|
|
girara_debug("g_content_type failed\n");
|
|
} else {
|
|
if (uncertain == FALSE) {
|
|
girara_debug("g_content_type detected filetype: %s", content_type);
|
|
return content_type;
|
|
}
|
|
girara_debug("g_content_type is uncertain, guess: %s", content_type);
|
|
}
|
|
|
|
FILE* f = fopen(path, "rb");
|
|
if (f == NULL) {
|
|
return NULL;
|
|
}
|
|
|
|
const int fd = fileno(f);
|
|
guchar* content = NULL;
|
|
size_t length = 0u;
|
|
ssize_t bytes_read = -1;
|
|
while (uncertain == TRUE && length < GT_MAX_READ && bytes_read != 0) {
|
|
g_free((void*)content_type);
|
|
content_type = NULL;
|
|
|
|
content = g_realloc(content, length + BUFSIZ);
|
|
bytes_read = read(fd, content + length, BUFSIZ);
|
|
if (bytes_read == -1) {
|
|
break;
|
|
}
|
|
|
|
length += bytes_read;
|
|
content_type = g_content_type_guess(NULL, content, length, &uncertain);
|
|
girara_debug("new guess: %s uncertain: %d, read: %zu", content_type, uncertain, length);
|
|
}
|
|
|
|
fclose(f);
|
|
g_free(content);
|
|
if (uncertain == FALSE) {
|
|
return content_type;
|
|
}
|
|
|
|
g_free((void*)content_type);
|
|
return NULL;
|
|
}
|
|
|
|
/**
 * Determine the content type of a file.
 *
 * The detection methods are tried in a fixed order and the first non-NULL
 * result is returned: guess_type_magic(), then guess_type_glib(), then
 * guess_type_file().
 *
 * @param path Path of the file to inspect
 * @return Content type string produced by the first method that succeeds, or
 *         NULL if all of them fail
 */
const char*
guess_content_type(const char* path)
{
  /* libmagic takes precedence */
  const char* result = guess_type_magic(path);

  /* next comes the g_content_type_guess based method */
  if (result == NULL) {
    result = guess_type_glib(path);
  }

  /* the external file program is the last resort */
  if (result == NULL) {
    result = guess_type_file(path);
  }

  return result;
}
|