GIcon: add g_icon_[de]serialize()
[glib.git] / gio / gcharsetconverter.c
blobc7f480757c78fa772ef4ffcfcc53cc3c47a0a540
1 /* GIO - GLib Input, Output and Streaming Library
3 * Copyright (C) 2009 Red Hat, Inc.
5 * This library is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU Lesser General Public
7 * License as published by the Free Software Foundation; either
8 * version 2 of the License, or (at your option) any later version.
10 * This library is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * Lesser General Public License for more details.
15 * You should have received a copy of the GNU Lesser General
16 * Public License along with this library; if not, write to the
17 * Free Software Foundation, Inc., 59 Temple Place, Suite 330,
18 * Boston, MA 02111-1307, USA.
20 * Author: Alexander Larsson <alexl@redhat.com>
23 #include "config.h"
25 #include "gcharsetconverter.h"
27 #include <errno.h>
29 #include "ginitable.h"
30 #include "gioerror.h"
31 #include "glibintl.h"
34 enum {
35 PROP_0,
36 PROP_FROM_CHARSET,
37 PROP_TO_CHARSET,
38 PROP_USE_FALLBACK
41 /**
42 * SECTION:gcharsetconverter
43 * @short_description: Convert between charsets
44 * @include: gio/gio.h
46 * #GCharsetConverter is an implementation of #GConverter based on
47 * GIConv.
50 static void g_charset_converter_iface_init (GConverterIface *iface);
51 static void g_charset_converter_initable_iface_init (GInitableIface *iface);
53 /**
54 * GCharsetConverter:
56 * Conversions between character sets.
58 struct _GCharsetConverter
60 GObject parent_instance;
62 char *from;
63 char *to;
64 GIConv iconv;
65 gboolean use_fallback;
66 guint n_fallback_errors;
69 G_DEFINE_TYPE_WITH_CODE (GCharsetConverter, g_charset_converter, G_TYPE_OBJECT,
70 G_IMPLEMENT_INTERFACE (G_TYPE_CONVERTER,
71 g_charset_converter_iface_init);
72 G_IMPLEMENT_INTERFACE (G_TYPE_INITABLE,
73 g_charset_converter_initable_iface_init))
75 static void
76 g_charset_converter_finalize (GObject *object)
78 GCharsetConverter *conv;
80 conv = G_CHARSET_CONVERTER (object);
82 g_free (conv->from);
83 g_free (conv->to);
84 if (conv->iconv)
85 g_iconv_close (conv->iconv);
87 G_OBJECT_CLASS (g_charset_converter_parent_class)->finalize (object);
90 static void
91 g_charset_converter_set_property (GObject *object,
92 guint prop_id,
93 const GValue *value,
94 GParamSpec *pspec)
96 GCharsetConverter *conv;
98 conv = G_CHARSET_CONVERTER (object);
100 switch (prop_id)
102 case PROP_TO_CHARSET:
103 g_free (conv->to);
104 conv->to = g_value_dup_string (value);
105 break;
107 case PROP_FROM_CHARSET:
108 g_free (conv->from);
109 conv->from = g_value_dup_string (value);
110 break;
112 case PROP_USE_FALLBACK:
113 conv->use_fallback = g_value_get_boolean (value);
114 break;
116 default:
117 G_OBJECT_WARN_INVALID_PROPERTY_ID (object, prop_id, pspec);
118 break;
123 static void
124 g_charset_converter_get_property (GObject *object,
125 guint prop_id,
126 GValue *value,
127 GParamSpec *pspec)
129 GCharsetConverter *conv;
131 conv = G_CHARSET_CONVERTER (object);
133 switch (prop_id)
135 case PROP_TO_CHARSET:
136 g_value_set_string (value, conv->to);
137 break;
139 case PROP_FROM_CHARSET:
140 g_value_set_string (value, conv->from);
141 break;
143 case PROP_USE_FALLBACK:
144 g_value_set_boolean (value, conv->use_fallback);
145 break;
147 default:
148 G_OBJECT_WARN_INVALID_PROPERTY_ID (object, prop_id, pspec);
149 break;
153 static void
154 g_charset_converter_class_init (GCharsetConverterClass *klass)
156 GObjectClass *gobject_class = G_OBJECT_CLASS (klass);
158 gobject_class->finalize = g_charset_converter_finalize;
159 gobject_class->get_property = g_charset_converter_get_property;
160 gobject_class->set_property = g_charset_converter_set_property;
162 g_object_class_install_property (gobject_class,
163 PROP_TO_CHARSET,
164 g_param_spec_string ("to-charset",
165 P_("To Charset"),
166 P_("The character encoding to convert to"),
167 NULL,
168 G_PARAM_READWRITE | G_PARAM_CONSTRUCT_ONLY |
169 G_PARAM_STATIC_STRINGS));
170 g_object_class_install_property (gobject_class,
171 PROP_FROM_CHARSET,
172 g_param_spec_string ("from-charset",
173 P_("From Charset"),
174 P_("The character encoding to convert from"),
175 NULL,
176 G_PARAM_READWRITE | G_PARAM_CONSTRUCT_ONLY |
177 G_PARAM_STATIC_STRINGS));
178 g_object_class_install_property (gobject_class,
179 PROP_USE_FALLBACK,
180 g_param_spec_boolean ("use-fallback",
181 P_("Fallback enabled"),
182 P_("Use fallback (of form \\<hexval>) for invalid bytes"),
183 FALSE,
184 G_PARAM_READWRITE |
185 G_PARAM_CONSTRUCT |
186 G_PARAM_STATIC_STRINGS));
189 static void
190 g_charset_converter_init (GCharsetConverter *local)
196 * g_charset_converter_new:
197 * @to_charset: destination charset
198 * @from_charset: source charset
199 * @error: #GError for error reporting, or %NULL to ignore.
201 * Creates a new #GCharsetConverter.
203 * Returns: a new #GCharsetConverter or %NULL on error.
205 * Since: 2.24
207 GCharsetConverter *
208 g_charset_converter_new (const gchar *to_charset,
209 const gchar *from_charset,
210 GError **error)
212 GCharsetConverter *conv;
214 conv = g_initable_new (G_TYPE_CHARSET_CONVERTER,
215 NULL, error,
216 "to-charset", to_charset,
217 "from-charset", from_charset,
218 NULL);
220 return conv;
223 static void
224 g_charset_converter_reset (GConverter *converter)
226 GCharsetConverter *conv = G_CHARSET_CONVERTER (converter);
228 if (conv->iconv == NULL)
230 g_warning ("Invalid object, not initialized");
231 return;
234 g_iconv (conv->iconv, NULL, NULL, NULL, NULL);
235 conv->n_fallback_errors = 0;
238 static GConverterResult
239 g_charset_converter_convert (GConverter *converter,
240 const void *inbuf,
241 gsize inbuf_size,
242 void *outbuf,
243 gsize outbuf_size,
244 GConverterFlags flags,
245 gsize *bytes_read,
246 gsize *bytes_written,
247 GError **error)
249 GCharsetConverter *conv;
250 gsize res;
251 GConverterResult ret;
252 gchar *inbufp, *outbufp;
253 gsize in_left, out_left;
254 int errsv;
255 gboolean reset;
257 conv = G_CHARSET_CONVERTER (converter);
259 if (conv->iconv == NULL)
261 g_set_error_literal (error, G_IO_ERROR, G_IO_ERROR_NOT_INITIALIZED,
262 _("Invalid object, not initialized"));
263 return G_CONVERTER_ERROR;
266 inbufp = (char *)inbuf;
267 outbufp = (char *)outbuf;
268 in_left = inbuf_size;
269 out_left = outbuf_size;
270 reset = FALSE;
272 /* if there is not input try to flush the data */
273 if (inbuf_size == 0)
275 if (flags & G_CONVERTER_INPUT_AT_END ||
276 flags & G_CONVERTER_FLUSH)
278 reset = TRUE;
280 else
282 g_set_error_literal (error, G_IO_ERROR, G_IO_ERROR_PARTIAL_INPUT,
283 _("Incomplete multibyte sequence in input"));
284 return G_CONVERTER_ERROR;
288 if (reset)
289 /* call g_iconv with NULL inbuf to cleanup shift state */
290 res = g_iconv (conv->iconv,
291 NULL, &in_left,
292 &outbufp, &out_left);
293 else
294 res = g_iconv (conv->iconv,
295 &inbufp, &in_left,
296 &outbufp, &out_left);
298 *bytes_read = inbufp - (char *)inbuf;
299 *bytes_written = outbufp - (char *)outbuf;
301 /* Don't report error if we converted anything */
302 if (res == (gsize) -1 && *bytes_read == 0)
304 errsv = errno;
306 switch (errsv)
308 case EINVAL:
309 /* Incomplete input text */
310 g_set_error_literal (error, G_IO_ERROR, G_IO_ERROR_PARTIAL_INPUT,
311 _("Incomplete multibyte sequence in input"));
312 break;
314 case E2BIG:
315 /* Not enough destination space */
316 g_set_error_literal (error, G_IO_ERROR, G_IO_ERROR_NO_SPACE,
317 _("Not enough space in destination"));
318 break;
320 case EILSEQ:
321 /* Invalid code sequence */
322 if (conv->use_fallback)
324 if (outbuf_size < 3)
325 g_set_error_literal (error, G_IO_ERROR, G_IO_ERROR_NO_SPACE,
326 _("Not enough space in destination"));
327 else
329 const char hex[] = "0123456789ABCDEF";
330 guint8 v = *(guint8 *)inbuf;
331 guint8 *out = (guint8 *)outbuf;
332 out[0] = '\\';
333 out[1] = hex[(v & 0xf0) >> 4];
334 out[2] = hex[(v & 0x0f) >> 0];
335 *bytes_read = 1;
336 *bytes_written = 3;
337 in_left--;
338 conv->n_fallback_errors++;
339 goto ok;
342 else
343 g_set_error_literal (error, G_IO_ERROR, G_IO_ERROR_INVALID_DATA,
344 _("Invalid byte sequence in conversion input"));
345 break;
347 default:
348 g_set_error (error, G_IO_ERROR, G_IO_ERROR_FAILED,
349 _("Error during conversion: %s"),
350 g_strerror (errsv));
351 break;
353 ret = G_CONVERTER_ERROR;
355 else
358 ret = G_CONVERTER_CONVERTED;
360 if (reset &&
361 (flags & G_CONVERTER_INPUT_AT_END))
362 ret = G_CONVERTER_FINISHED;
363 else if (reset &&
364 (flags & G_CONVERTER_FLUSH))
365 ret = G_CONVERTER_FLUSHED;
368 return ret;
372 * g_charset_converter_set_use_fallback:
373 * @converter: a #GCharsetConverter
374 * @use_fallback: %TRUE to use fallbacks
376 * Sets the #GCharsetConverter:use-fallback property.
378 * Since: 2.24
380 void
381 g_charset_converter_set_use_fallback (GCharsetConverter *converter,
382 gboolean use_fallback)
384 use_fallback = !!use_fallback;
386 if (converter->use_fallback != use_fallback)
388 converter->use_fallback = use_fallback;
389 g_object_notify (G_OBJECT (converter), "use-fallback");
394 * g_charset_converter_get_use_fallback:
395 * @converter: a #GCharsetConverter
397 * Gets the #GCharsetConverter:use-fallback property.
399 * Returns: %TRUE if fallbacks are used by @converter
401 * Since: 2.24
403 gboolean
404 g_charset_converter_get_use_fallback (GCharsetConverter *converter)
406 return converter->use_fallback;
410 * g_charset_converter_get_num_fallbacks:
411 * @converter: a #GCharsetConverter
413 * Gets the number of fallbacks that @converter has applied so far.
415 * Returns: the number of fallbacks that @converter has applied
417 * Since: 2.24
419 guint
420 g_charset_converter_get_num_fallbacks (GCharsetConverter *converter)
422 return converter->n_fallback_errors;
425 static void
426 g_charset_converter_iface_init (GConverterIface *iface)
428 iface->convert = g_charset_converter_convert;
429 iface->reset = g_charset_converter_reset;
432 static gboolean
433 g_charset_converter_initable_init (GInitable *initable,
434 GCancellable *cancellable,
435 GError **error)
437 GCharsetConverter *conv;
439 g_return_val_if_fail (G_IS_CHARSET_CONVERTER (initable), FALSE);
441 conv = G_CHARSET_CONVERTER (initable);
443 if (cancellable != NULL)
445 g_set_error_literal (error, G_IO_ERROR, G_IO_ERROR_NOT_SUPPORTED,
446 _("Cancellable initialization not supported"));
447 return FALSE;
450 conv->iconv =
451 g_iconv_open (conv->to, conv->from);
453 if (conv->iconv == (GIConv)-1)
455 if (errno == EINVAL)
456 g_set_error (error, G_IO_ERROR, G_IO_ERROR_NOT_SUPPORTED,
457 _("Conversion from character set '%s' to '%s' is not supported"),
458 conv->from, conv->to);
459 else
460 g_set_error (error, G_IO_ERROR, G_IO_ERROR_FAILED,
461 _("Could not open converter from '%s' to '%s'"),
462 conv->from, conv->to);
463 return FALSE;
466 return TRUE;
469 static void
470 g_charset_converter_initable_iface_init (GInitableIface *iface)
472 iface->init = g_charset_converter_initable_init;