mirror of
https://git.notmuchmail.org/git/notmuch
synced 2024-11-25 04:18:08 +01:00
hex-escape: (en|de)code strings to/from restricted character set
The character set is chosen to be suitable for pathnames, and is the same as that used by contrib/nmbug. [With additions by Jani Nikula]
This commit is contained in:
parent
113e30c01b
commit
902f2e19bd
3 changed files with 203 additions and 1 deletions
|
@ -3,7 +3,7 @@
|
||||||
dir := util
|
dir := util
|
||||||
extra_cflags += -I$(srcdir)/$(dir)
|
extra_cflags += -I$(srcdir)/$(dir)
|
||||||
|
|
||||||
libutil_c_srcs := $(dir)/xutil.c $(dir)/error_util.c
|
libutil_c_srcs := $(dir)/xutil.c $(dir)/error_util.c $(dir)/hex-escape.c
|
||||||
|
|
||||||
libutil_modules := $(libutil_c_srcs:.c=.o)
|
libutil_modules := $(libutil_c_srcs:.c=.o)
|
||||||
|
|
||||||
|
|
161
util/hex-escape.c
Normal file
161
util/hex-escape.c
Normal file
|
@ -0,0 +1,161 @@
|
||||||
|
/* hex-escape.c - Manage encoding and decoding of byte strings into path names
|
||||||
|
*
|
||||||
|
* Copyright (c) 2011 David Bremner
|
||||||
|
*
|
||||||
|
* This program is free software: you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU General Public License as published by
|
||||||
|
* the Free Software Foundation, either version 3 of the License, or
|
||||||
|
* (at your option) any later version.
|
||||||
|
*
|
||||||
|
* This program is distributed in the hope that it will be useful,
|
||||||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
* GNU General Public License for more details.
|
||||||
|
*
|
||||||
|
* You should have received a copy of the GNU General Public License
|
||||||
|
* along with this program. If not, see http://www.gnu.org/licenses/ .
|
||||||
|
*
|
||||||
|
* Author: David Bremner <david@tethera.net>
|
||||||
|
*/
|
||||||
|
|
||||||
|
#include <assert.h>
|
||||||
|
#include <string.h>
|
||||||
|
#include <talloc.h>
|
||||||
|
#include <ctype.h>
|
||||||
|
#include "error_util.h"
|
||||||
|
#include "hex-escape.h"
|
||||||
|
|
||||||
|
/* Default buffer size.
 * NOTE(review): no function visible in this file refers to this
 * constant -- confirm whether it is still needed. */
static const size_t default_buf_size = 1024;
|
||||||
|
|
||||||
|
/* Characters that hex_encode() copies to its output unchanged; every
 * other byte is written as an escape sequence. */
static const char *const output_charset =
    "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+-_@=.,";

/* Byte that introduces a two-digit hexadecimal escape sequence. */
static const char escape_char = '%';

/* Return non-zero iff 'c' is a member of output_charset.
 *
 * strchr() considers the terminating NUL to be part of the string it
 * searches, so NUL has to be rejected explicitly: it is never a
 * literal output character.
 */
static int
is_output (char c)
{
    return c != '\0' && strchr (output_charset, c) != NULL;
}
|
||||||
|
|
||||||
|
static int
|
||||||
|
maybe_realloc (void *ctx, size_t needed, char **out, size_t *out_size)
|
||||||
|
{
|
||||||
|
if (*out_size < needed) {
|
||||||
|
|
||||||
|
if (*out == NULL)
|
||||||
|
*out = talloc_size (ctx, needed);
|
||||||
|
else
|
||||||
|
*out = talloc_realloc (ctx, *out, char, needed);
|
||||||
|
|
||||||
|
if (*out == NULL)
|
||||||
|
return 0;
|
||||||
|
|
||||||
|
*out_size = needed;
|
||||||
|
}
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
hex_status_t
|
||||||
|
hex_encode (void *ctx, const char *in, char **out, size_t *out_size)
|
||||||
|
{
|
||||||
|
|
||||||
|
const char *p;
|
||||||
|
char *q;
|
||||||
|
|
||||||
|
size_t needed = 1; /* for the NUL */
|
||||||
|
|
||||||
|
assert (ctx); assert (in); assert (out); assert (out_size);
|
||||||
|
|
||||||
|
for (p = in; *p; p++) {
|
||||||
|
needed += is_output (*p) ? 1 : 3;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (*out == NULL)
|
||||||
|
*out_size = 0;
|
||||||
|
|
||||||
|
if (!maybe_realloc (ctx, needed, out, out_size))
|
||||||
|
return HEX_OUT_OF_MEMORY;
|
||||||
|
|
||||||
|
q = *out;
|
||||||
|
p = in;
|
||||||
|
|
||||||
|
while (*p) {
|
||||||
|
if (is_output (*p)) {
|
||||||
|
*q++ = *p++;
|
||||||
|
} else {
|
||||||
|
sprintf (q, "%%%02x", (unsigned char)*p++);
|
||||||
|
q += 3;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
*q = '\0';
|
||||||
|
return HEX_SUCCESS;
|
||||||
|
}
|
||||||
|
|
||||||
|
/* Hex decode 'in' to 'out'.
|
||||||
|
*
|
||||||
|
* This must succeed for in == out to support hex_decode_inplace().
|
||||||
|
*/
|
||||||
|
static hex_status_t
|
||||||
|
hex_decode_internal (const char *in, unsigned char *out)
|
||||||
|
{
|
||||||
|
char buf[3];
|
||||||
|
|
||||||
|
while (*in) {
|
||||||
|
if (*in == escape_char) {
|
||||||
|
char *endp;
|
||||||
|
|
||||||
|
/* This also handles unexpected end-of-string. */
|
||||||
|
if (!isxdigit ((unsigned char) in[1]) ||
|
||||||
|
!isxdigit ((unsigned char) in[2]))
|
||||||
|
return HEX_SYNTAX_ERROR;
|
||||||
|
|
||||||
|
buf[0] = in[1];
|
||||||
|
buf[1] = in[2];
|
||||||
|
buf[2] = '\0';
|
||||||
|
|
||||||
|
*out = strtoul (buf, &endp, 16);
|
||||||
|
|
||||||
|
if (endp != buf + 2)
|
||||||
|
return HEX_SYNTAX_ERROR;
|
||||||
|
|
||||||
|
in += 3;
|
||||||
|
out++;
|
||||||
|
} else {
|
||||||
|
*out++ = *in++;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
*out = '\0';
|
||||||
|
|
||||||
|
return HEX_SUCCESS;
|
||||||
|
}
|
||||||
|
|
||||||
|
hex_status_t
|
||||||
|
hex_decode_inplace (char *s)
|
||||||
|
{
|
||||||
|
/* A decoded string is never longer than the encoded one, so it is
|
||||||
|
* safe to decode a string onto itself. */
|
||||||
|
return hex_decode_internal (s, (unsigned char *) s);
|
||||||
|
}
|
||||||
|
|
||||||
|
hex_status_t
|
||||||
|
hex_decode (void *ctx, const char *in, char **out, size_t * out_size)
|
||||||
|
{
|
||||||
|
const char *p;
|
||||||
|
size_t needed = 1; /* for the NUL */
|
||||||
|
|
||||||
|
assert (ctx); assert (in); assert (out); assert (out_size);
|
||||||
|
|
||||||
|
for (p = in; *p; p++)
|
||||||
|
if ((p[0] == escape_char) && isxdigit (p[1]) && isxdigit (p[2]))
|
||||||
|
needed -= 1;
|
||||||
|
else
|
||||||
|
needed += 1;
|
||||||
|
|
||||||
|
if (!maybe_realloc (ctx, needed, out, out_size))
|
||||||
|
return HEX_OUT_OF_MEMORY;
|
||||||
|
|
||||||
|
return hex_decode_internal (in, (unsigned char *) *out);
|
||||||
|
}
|
41
util/hex-escape.h
Normal file
41
util/hex-escape.h
Normal file
|
@ -0,0 +1,41 @@
|
||||||
|
#ifndef HEX_ESCAPE_H
#define HEX_ESCAPE_H

#include <stddef.h>     /* size_t */

/* Status codes returned by the hex_* routines. */
typedef enum hex_status {
    HEX_SUCCESS = 0,
    HEX_SYNTAX_ERROR,   /* malformed escape sequence in the input */
    HEX_OUT_OF_MEMORY   /* the output buffer could not be (re)allocated */
} hex_status_t;

/*
 * The API for hex_encode() and hex_decode() is modelled on that for
 * getline.
 *
 * If 'out' points to a NULL pointer a char array of the appropriate
 * size is allocated using talloc, and out_size is updated.
 *
 * If 'out' points to a non-NULL pointer, it is assumed to describe an
 * existing char array, with the size given in *out_size. This array
 * may be resized by talloc_realloc if needed; in this case *out_size
 * will also be updated.
 *
 * Note that it is an error to pass a NULL pointer for any parameter
 * of these routines.
 */

/* Encode 'in', replacing every byte outside the restricted character
 * set by '%' followed by two hexadecimal digits. */
hex_status_t
hex_encode (void *talloc_ctx, const char *in, char **out,
            size_t *out_size);

/* Decode 'in', the inverse of hex_encode(). Returns HEX_SYNTAX_ERROR
 * if 'in' contains a malformed escape sequence. */
hex_status_t
hex_decode (void *talloc_ctx, const char *in, char **out,
            size_t *out_size);

/*
 * Non-allocating hex decode to decode 's' in-place. The length of the
 * result is always equal to or shorter than the length of the
 * original.
 */
hex_status_t
hex_decode_inplace (char *s);

#endif /* HEX_ESCAPE_H */
|
Loading…
Reference in a new issue