Do not open a second window for MooLua/window test

This commit is contained in:
Yevgen Muntyan 2012-08-11 01:24:22 -07:00
parent 54ef440232
commit b46ab8dfe4
4 changed files with 448 additions and 379 deletions

View File

@ -1,6 +1,7 @@
require("munit") require("munit")
window = editor.new_window() editor.close_docs(editor.get_docs())
window = editor.get_active_window()
tassert(#window.get_docs() == 1) tassert(#window.get_docs() == 1)
tassert(window.get_docs()[1] == window.get_active_doc()) tassert(window.get_docs()[1] == window.get_active_doc())
editor.new_doc(window) editor.new_doc(window)
@ -85,5 +86,3 @@ tassert_eq(doc1.get_n_views(), 1)
tassert(editor.close_docs({doc1, doc2, doc3})) tassert(editor.close_docs({doc1, doc2, doc3}))
tassert_eq(window.get_docs(), {doc4}) tassert_eq(window.get_docs(), {doc4})
tassert_eq(editor.get_active_doc(), doc4) tassert_eq(editor.get_active_doc(), doc4)
window.close()

View File

@ -44,13 +44,8 @@
#include <glib/gstdio.h> #include <glib/gstdio.h>
#undef LOAD_BINARY
#define ENCODING_LOCALE "LOCALE" #define ENCODING_LOCALE "LOCALE"
#ifndef O_BINARY
#define O_BINARY 0
#endif
MOO_DEFINE_QUARK (MooEditFileErrorQuark, _moo_edit_file_error_quark) MOO_DEFINE_QUARK (MooEditFileErrorQuark, _moo_edit_file_error_quark)
static GSList *UNTITLED = NULL; static GSList *UNTITLED = NULL;
@ -64,11 +59,10 @@ static void file_deleted (MooEdit *edit);
static void add_status (MooEdit *edit, static void add_status (MooEdit *edit,
MooEditStatus s); MooEditStatus s);
static gboolean moo_edit_load_local (MooEdit *edit, static void moo_edit_load_text (MooEdit *edit,
GFile *file, GFile *file,
const char *encoding, const char *encoding,
const char *cached_encoding, const char *text);
GError **error);
static gboolean moo_edit_reload_local (MooEdit *edit, static gboolean moo_edit_reload_local (MooEdit *edit,
const char *encoding, const char *encoding,
GError **error); GError **error);
@ -84,6 +78,13 @@ static gboolean moo_edit_save_copy_local (MooEdit *edit,
GError **error); GError **error);
static void _moo_edit_start_file_watch (MooEdit *edit); static void _moo_edit_start_file_watch (MooEdit *edit);
static char *moo_convert_file_data_to_utf8 (const char *data,
gsize len,
const char *encoding,
const char *cached_encoding,
char **used_enc);
static gboolean check_regular (GFile *file,
GError **error);
gboolean gboolean
_moo_is_file_error_cancelled (GError *error) _moo_is_file_error_cancelled (GError *error)
@ -117,38 +118,57 @@ _moo_edit_file_is_new (GFile *file)
} }
gboolean static gboolean
_moo_edit_load_file (MooEdit *edit, load_file_contents (GFile *gfile,
GFile *file, char **data,
const char *encoding, gsize *data_len,
const char *cached_encoding, GError **error)
GError **error)
{ {
char *freeme1 = NULL; char *path = NULL;
char *freeme2 = NULL; gboolean retval = FALSE;
gboolean result;
if (!check_regular (gfile, error))
return FALSE;
if (!(path = g_file_get_path (gfile)))
{
g_set_error (error, MOO_EDIT_FILE_ERROR,
MOO_EDIT_FILE_ERROR_NOT_IMPLEMENTED,
"Loading remote files is not implemented");
return FALSE;
}
retval = g_file_get_contents (path, data, data_len, error);
g_free (path);
return retval;
}
static char *
convert_file_data_to_utf8_with_prompt (const char *data,
gsize data_len,
GFile *file,
const char *encoding,
const char *cached_encoding,
char **used_encoding,
GError **error)
{
char *freeme = NULL;
char *text_utf8 = NULL;
GError *error_here = NULL; GError *error_here = NULL;
char *new_encoding = NULL;
moo_return_error_if_fail (MOO_IS_EDIT (edit));
moo_return_error_if_fail (G_IS_FILE (file));
moo_return_error_if_fail (!MOO_EDIT_IS_BUSY (edit));
encoding = freeme1 = g_strdup (normalize_encoding (encoding, FALSE));
cached_encoding = freeme2 = cached_encoding ? g_strdup (normalize_encoding (cached_encoding, FALSE)) : NULL;
while (TRUE) while (TRUE)
{ {
char *new_encoding = NULL;
MooEditTryEncodingResponse response; MooEditTryEncodingResponse response;
result = moo_edit_load_local (edit, file, encoding, cached_encoding, &error_here); text_utf8 = moo_convert_file_data_to_utf8 (data, data_len, encoding, cached_encoding, &new_encoding);
if (result) if (text_utf8)
break; break;
if (!error_here || error_here->domain != MOO_EDIT_FILE_ERROR || g_free (new_encoding);
error_here->code != MOO_EDIT_FILE_ERROR_ENCODING) new_encoding = NULL;
break;
response = _moo_edit_try_encoding_dialog (file, encoding, &new_encoding); response = _moo_edit_try_encoding_dialog (file, encoding, &new_encoding);
@ -173,14 +193,64 @@ _moo_edit_load_file (MooEdit *edit,
if (!new_encoding) if (!new_encoding)
break; break;
g_free (freeme1); g_free (freeme);
encoding = freeme1 = new_encoding; encoding = freeme = new_encoding;
cached_encoding = NULL; cached_encoding = NULL;
} }
if (error_here) if (error_here)
g_propagate_error (error, error_here); g_propagate_error (error, error_here);
*used_encoding = g_strdup (new_encoding);
g_free (freeme);
return text_utf8;
}
gboolean
_moo_edit_load_file (MooEdit *edit,
GFile *file,
const char *encoding,
const char *cached_encoding,
GError **error)
{
char *freeme1 = NULL;
char *freeme2 = NULL;
gboolean result = FALSE;
GError *error_here = NULL;
char *data = NULL;
gsize data_len = 0;
char *data_utf8 = NULL;
char *used_encoding = NULL;
moo_return_error_if_fail (MOO_IS_EDIT (edit));
moo_return_error_if_fail (G_IS_FILE (file));
moo_return_error_if_fail (!MOO_EDIT_IS_BUSY (edit));
encoding = freeme1 = g_strdup (normalize_encoding (encoding, FALSE));
cached_encoding = freeme2 = cached_encoding ? g_strdup (normalize_encoding (cached_encoding, FALSE)) : NULL;
if (!load_file_contents (file, &data, &data_len, &error_here))
goto done;
data_utf8 = convert_file_data_to_utf8_with_prompt (data, data_len, file, encoding, cached_encoding, &used_encoding, &error_here);
if (data_utf8 == NULL)
goto done;
moo_edit_load_text (edit, file, used_encoding, data_utf8);
result = TRUE;
done:
if (!result)
_moo_edit_stop_file_watch (edit);
if (error_here)
g_propagate_error (error, error_here);
g_free (used_encoding);
g_free (data_utf8);
g_free (data);
g_free (freeme1); g_free (freeme1);
g_free (freeme2); g_free (freeme2);
return result; return result;
@ -311,21 +381,8 @@ moo_edit_set_line_end_type (MooEdit *edit,
/* File loading /* File loading
*/ */
typedef enum { static void do_load_text (MooEdit *edit,
SUCCESS, const char *text);
ERROR_FILE,
ERROR_ENCODING
} LoadResult;
static LoadResult do_load (MooEdit *edit,
GFile *file,
const char *encoding,
GError **error);
#ifdef LOAD_BINARY
static LoadResult load_binary (MooEdit *edit,
const char *file,
GError **error);
#endif
static GSList * static GSList *
get_encodings (void) get_encodings (void)
@ -371,32 +428,6 @@ get_encodings (void)
} }
static LoadResult
try_load (MooEdit *edit,
GFile *file,
const char *encoding,
GError **error)
{
GtkTextBuffer *buffer;
gboolean enable_highlight;
LoadResult result = ERROR_FILE;
g_return_val_if_fail (MOO_IS_EDIT (edit), result);
g_return_val_if_fail (G_IS_FILE (file), result);
g_return_val_if_fail (encoding && encoding[0], result);
buffer = moo_edit_get_buffer (edit);
gtk_text_buffer_set_text (buffer, "", 0);
g_object_get (buffer, "highlight-syntax", &enable_highlight, (char*) 0);
g_object_set (buffer, "highlight-syntax", FALSE, (char*) 0);
result = do_load (edit, file, encoding, error);
g_object_set (buffer, "highlight-syntax", enable_highlight, (char*) 0);
return result;
}
static gboolean static gboolean
check_regular (GFile *file, check_regular (GFile *file,
GError **error) GError **error)
@ -424,26 +455,18 @@ check_regular (GFile *file,
return retval; return retval;
} }
static gboolean static void
moo_edit_load_local (MooEdit *edit, moo_edit_load_text (MooEdit *edit,
GFile *file, GFile *file,
const char *encoding, const char *encoding,
const char *cached_encoding, const char *text)
GError **error)
{ {
GtkTextIter start; GtkTextIter start;
GtkTextBuffer *buffer; GtkTextBuffer *buffer;
gboolean undo; gboolean undo;
LoadResult result = ERROR_FILE;
char *freeme = NULL; char *freeme = NULL;
MooLineEndType saved_le; MooLineEndType saved_le;
moo_return_error_if_fail (MOO_IS_EDIT (edit));
moo_return_error_if_fail (G_IS_FILE (file));
if (!check_regular (file, error))
return FALSE;
if (moo_edit_is_empty (edit)) if (moo_edit_is_empty (edit))
undo = FALSE; undo = FALSE;
else else
@ -462,75 +485,18 @@ moo_edit_load_local (MooEdit *edit,
saved_le = edit->priv->line_end_type; saved_le = edit->priv->line_end_type;
if (!encoding)
{ {
GSList *encodings; gboolean enable_highlight;
buffer = moo_edit_get_buffer (edit);
encodings = get_encodings ();
if (cached_encoding)
encodings = g_slist_prepend (encodings, g_strdup (cached_encoding));
result = ERROR_ENCODING;
while (encodings)
{
char *enc;
enc = (char*) encodings->data;
encodings = g_slist_delete_link (encodings, encodings);
g_clear_error (error);
result = try_load (edit, file, enc, error);
if (result != ERROR_ENCODING)
{
encoding = freeme = enc;
break;
}
g_free (enc);
}
g_slist_foreach (encodings, (GFunc) g_free, NULL);
g_slist_free (encodings);
}
else
{
result = try_load (edit, file, encoding, error);
}
#ifdef LOAD_BINARY
if (result == ERROR_ENCODING)
{
g_clear_error (error);
result = load_binary (edit, file, &statbuf, error);
}
#endif
if (result == ERROR_ENCODING)
set_encoding_error (error);
if (result != SUCCESS)
gtk_text_buffer_set_text (buffer, "", 0); gtk_text_buffer_set_text (buffer, "", 0);
g_object_get (buffer, "highlight-syntax", &enable_highlight, (char*) 0);
g_object_set (buffer, "highlight-syntax", FALSE, (char*) 0);
do_load_text (edit, text);
g_object_set (buffer, "highlight-syntax", enable_highlight, (char*) 0);
}
unblock_buffer_signals (edit); unblock_buffer_signals (edit);
if (result == SUCCESS)
{
/* XXX */
gtk_text_buffer_get_start_iter (buffer, &start);
gtk_text_buffer_place_cursor (buffer, &start);
edit->priv->status = (MooEditStatus) 0;
moo_edit_set_modified (edit, FALSE);
_moo_edit_set_file (edit, file, encoding);
if (edit->priv->line_end_type != saved_le)
g_object_notify (G_OBJECT (edit), "line-end-type");
_moo_edit_start_file_watch (edit);
}
else
{
_moo_edit_stop_file_watch (edit);
}
if (undo) if (undo)
gtk_text_buffer_end_user_action (buffer); gtk_text_buffer_end_user_action (buffer);
else else
@ -538,151 +504,88 @@ moo_edit_load_local (MooEdit *edit,
moo_text_buffer_end_non_interactive_action (MOO_TEXT_BUFFER (buffer)); moo_text_buffer_end_non_interactive_action (MOO_TEXT_BUFFER (buffer));
gtk_text_buffer_get_start_iter (buffer, &start);
gtk_text_buffer_place_cursor (buffer, &start);
edit->priv->status = (MooEditStatus) 0;
moo_edit_set_modified (edit, FALSE);
_moo_edit_set_file (edit, file, encoding);
if (edit->priv->line_end_type != saved_le)
g_object_notify (G_OBJECT (edit), "line-end-type");
_moo_edit_start_file_watch (edit);
g_free (freeme); g_free (freeme);
return result == SUCCESS;
} }
static LoadResult static void
do_load (MooEdit *edit, do_load_text (MooEdit *edit,
GFile *gfile, const char *text)
const char *encoding,
GError **error)
{ {
GIOChannel *file = NULL;
GIOStatus status;
GtkTextBuffer *buffer; GtkTextBuffer *buffer;
MooLineEndType le = MOO_LE_NONE; MooLineEndType le = MOO_LE_NONE;
gboolean mixed_le = FALSE; gboolean mixed_le = FALSE;
GString *text = NULL; const char *line = NULL;
char *line = NULL; MooLineReader lr;
LoadResult result = ERROR_FILE; gsize line_len;
char *path; gsize line_term_len;
GString *strbuf;
g_return_val_if_fail (G_IS_FILE (gfile), ERROR_FILE); strbuf = g_string_new (NULL);
g_return_val_if_fail (encoding != NULL, ERROR_FILE);
if (!(path = g_file_get_path (gfile)))
{
g_set_error (error, MOO_EDIT_FILE_ERROR,
MOO_EDIT_FILE_ERROR_NOT_IMPLEMENTED,
"Loading remote files is not implemented");
return ERROR_FILE;
}
file = g_io_channel_new_file (path, "r", error);
g_free (path);
if (!file)
return ERROR_FILE;
if (g_io_channel_set_encoding (file, encoding, error) != G_IO_STATUS_NORMAL)
{
result = ERROR_ENCODING;
goto error_out;
}
text = g_string_new (NULL);
buffer = moo_edit_get_buffer (edit); buffer = moo_edit_get_buffer (edit);
while (TRUE) moo_line_reader_init (&lr, text, -1);
while ((line = moo_line_reader_get_line (&lr, &line_len, &line_term_len)) != NULL)
{ {
gboolean insert_line_term = FALSE; gboolean insert_line_term = FALSE;
gsize len, line_term_pos;
MooLineEndType le_here = MOO_LE_NONE; MooLineEndType le_here = MOO_LE_NONE;
gsize copy_len = line_len;
status = g_io_channel_read_line (file, &line, &len, &line_term_pos, error); if (line_term_len != 0)
if (status != G_IO_STATUS_NORMAL && status != G_IO_STATUS_EOF)
{ {
if ((*error)->domain == G_CONVERT_ERROR) const char *line_term = line + line_len;
result = ERROR_ENCODING;
insert_line_term = TRUE;
if (line_term_len == 1 && !strncmp (line_term, "\r", line_term_len))
{
le_here = MOO_LE_MAC;
}
else if (line_term_len == 1 && !strncmp (line_term, "\n", line_term_len))
{
le_here = MOO_LE_UNIX;
}
else if (line_term_len == 2 && !strncmp (line_term, "\r\n", line_term_len))
{
le_here = MOO_LE_WIN32;
}
else if (line_term_len == 3 && !strncmp ("\xe2\x80\xa9", line_term, line_term_len))
{
insert_line_term = FALSE;
copy_len += line_term_len;
}
else else
result = ERROR_FILE; {
goto error_out; g_critical ("oops");
copy_len += line_term_len;
}
if (le_here)
{
if (mixed_le || (le && le != le_here))
mixed_le = TRUE;
else
le = le_here;
}
} }
if (line) g_string_append_len (strbuf, line, copy_len);
{
const char *invalid;
gboolean valid_utf8 = g_utf8_validate (line, len, &invalid);
// allow trailing zero byte if (insert_line_term)
if (!valid_utf8 && invalid + 1 == line + len && *invalid == 0) g_string_append_c (strbuf, '\n');
{
valid_utf8 = TRUE;
len -= 1;
}
if (!valid_utf8)
{
result = ERROR_ENCODING;
g_set_error (error, G_CONVERT_ERROR,
G_CONVERT_ERROR_ILLEGAL_SEQUENCE,
"Invalid UTF8 data read from file");
goto error_out;
}
if (line_term_pos != len)
{
char *line_term = line + line_term_pos;
insert_line_term = TRUE;
len = line_term_pos;
if (!strcmp ("\xe2\x80\xa9", line_term))
{
insert_line_term = FALSE;
len = len + 3;
}
else if (!strcmp (line_term, "\r"))
{
le_here = MOO_LE_MAC;
}
else if (!strcmp (line_term, "\n"))
{
le_here = MOO_LE_UNIX;
}
else if (!strcmp (line_term, "\r\n"))
{
le_here = MOO_LE_WIN32;
}
if (le_here)
{
if (mixed_le || (le && le != le_here))
mixed_le = TRUE;
else
le = le_here;
}
}
g_string_append_len (text, line, len);
if (insert_line_term)
g_string_append_c (text, '\n');
#define MAX_TEXT_BUF_LEN 1000000
if (text->len > MAX_TEXT_BUF_LEN)
{
gtk_text_buffer_insert_at_cursor (buffer, text->str, text->len);
g_string_truncate (text, 0);
}
#undef MAX_TEXT_BUF_LEN
g_free (line);
}
if (status == G_IO_STATUS_EOF)
{
g_io_channel_shutdown (file, TRUE, NULL);
g_io_channel_unref (file);
break;
}
} }
if (text->len) gtk_text_buffer_insert_at_cursor (buffer, strbuf->str, strbuf->len);
gtk_text_buffer_insert_at_cursor (buffer, text->str, text->len);
if (mixed_le) if (mixed_le)
le = MOO_LE_NATIVE; le = MOO_LE_NATIVE;
@ -690,108 +593,10 @@ do_load (MooEdit *edit,
if (le != MOO_LE_NONE) if (le != MOO_LE_NONE)
moo_edit_set_line_end_type_full (edit, le, TRUE); moo_edit_set_line_end_type_full (edit, le, TRUE);
g_string_free (text, TRUE); g_string_free (strbuf, TRUE);
g_clear_error (error);
return SUCCESS;
error_out:
if (text)
g_string_free (text, TRUE);
if (file)
{
g_io_channel_shutdown (file, TRUE, NULL);
g_io_channel_unref (file);
}
g_free (line);
return result;
} }
#ifdef LOAD_BINARY
#define TEXT_BUF_LEN (1 << 16)
#define REPLACEMENT_CHAR '\1'
#define LINE_LEN 80
static LoadResult
load_binary (MooEdit *edit,
const char *filename,
GError **error)
{
GIOChannel *file = NULL;
GIOStatus status;
GtkTextBuffer *buffer;
moo_return_error_if_fail (filename != NULL);
buffer = moo_edit_get_buffer (edit);
file = g_io_channel_new_file (filename, "r", error);
if (!file)
return ERROR_FILE;
g_io_channel_set_encoding (file, NULL, NULL);
while (TRUE)
{
gsize len, line_len;
char buf[TEXT_BUF_LEN];
status = g_io_channel_read_chars (file, buf, TEXT_BUF_LEN, &len, error);
if (status != G_IO_STATUS_NORMAL && status != G_IO_STATUS_EOF)
goto error_out;
if (len)
{
guint i;
for (i = 0, line_len = 0; i < len; ++i, ++line_len)
{
if (buf[i] && !(buf[i] & 0x80))
continue;
if (line_len > LINE_LEN)
{
buf[i] = '\n';
line_len = 0;
}
else
{
buf[i] = REPLACEMENT_CHAR;
}
}
gtk_text_buffer_insert_at_cursor (buffer, buf, len);
}
if (status == G_IO_STATUS_EOF)
{
g_io_channel_shutdown (file, TRUE, NULL);
g_io_channel_unref (file);
break;
}
}
g_clear_error (error);
return SUCCESS;
error_out:
if (file)
{
g_io_channel_shutdown (file, TRUE, NULL);
g_io_channel_unref (file);
}
return ERROR_FILE;
}
#undef TEXT_BUF_LEN
#undef REPLACEMENT_CHAR
#undef LINE_LEN
#endif
/* XXX */ /* XXX */
static gboolean static gboolean
moo_edit_reload_local (MooEdit *edit, moo_edit_reload_local (MooEdit *edit,
@ -1347,3 +1152,250 @@ _moo_edit_get_icon (MooEdit *doc,
else else
return moo_get_icon_for_path (NULL, widget, size); return moo_get_icon_for_path (NULL, widget, size);
} }
/***************************************************************************
*
* Character encoding conversion
*
*/
#define BOM_UTF8 "\xEF\xBB\xBF"
#define BOM_UTF16 "\xFF\xFE"
#define BOM_UTF16_BE "\xFE\xFF"
#define BOM_UTF32 "\xFF\xFE\x00\x00"
#define BOM_UTF32_BE "\x00\x00\xFE\xFF"
static const struct {
const char *enc;
const char *enc_no_bom;
const char *bom;
gsize bom_len;
} bom_encs[] = {
{ "UTF-8-BOM", "UTF-8", BOM_UTF8, 3 },
{ "UTF-16-BOM", "UTF-16", BOM_UTF16, 2 },
{ "UTF-16BE-BOM", "UTF-16BE", BOM_UTF16_BE, 2 },
{ "UTF-32-BOM", "UTF-32", BOM_UTF32, 4 },
{ "UTF-32BE-BOM", "UTF-32BE", BOM_UTF32_BE, 4 },
};
static gboolean
encoding_needs_bom (const char *enc,
const char **enc_no_bom,
const char **bom,
gsize *bom_len)
{
guint i;
for (i = 0; i < G_N_ELEMENTS (bom_encs); ++i)
{
if (!g_ascii_strcasecmp (enc, bom_encs[i].enc))
{
*enc_no_bom = bom_encs[i].enc_no_bom;
*bom = bom_encs[i].bom;
*bom_len = bom_encs[i].bom_len;
return TRUE;
}
}
return FALSE;
}
static gboolean
encoding_allows_bom (const char *enc,
const char **bom,
gsize *bom_len)
{
guint i;
for (i = 0; i < G_N_ELEMENTS (bom_encs); ++i)
{
if (!g_ascii_strcasecmp (enc, bom_encs[i].enc_no_bom))
{
*bom = bom_encs[i].bom;
*bom_len = bom_encs[i].bom_len;
return TRUE;
}
}
return FALSE;
}
static gboolean
data_has_bom (const char *data,
gsize len,
const char **bom_enc)
{
guint i;
for (i = 0; i < G_N_ELEMENTS (bom_encs); ++i)
{
gsize bom_len = bom_encs[i].bom_len;
const char *bom = bom_encs[i].bom;
if (len >= bom_len && memcmp (data, bom, bom_len) == 0)
{
*bom_enc = bom_encs[i].enc;
return TRUE;
}
}
return FALSE;
}
static char *
try_convert_to_utf8_from_utf8 (const char *data,
gsize len)
{
const char *invalid;
gboolean valid_utf8;
// g_print ("try_convert_to_utf8_from_utf8()\n");
valid_utf8 = g_utf8_validate (data, len, &invalid);
// allow trailing zero byte
if (!valid_utf8 && invalid + 1 == data + len && *invalid == 0)
valid_utf8 = TRUE;
return valid_utf8 ? g_strdup (data) : NULL;
}
static char *
try_convert_to_utf8_from_non_utf8_encoding (const char *data,
gsize len,
const char *enc)
{
const char *enc_no_bom = NULL;
const char *bom = NULL;
gsize bom_len = 0;
gsize bytes_read = 0;
gsize bytes_written = 0;
char *result = NULL;
gsize result_len = 0;
// g_print ("try_convert_to_utf8_from_non_utf8_encoding(%s)\n",
// enc ? enc : "<null>");
if (encoding_needs_bom (enc, &enc_no_bom, &bom, &bom_len))
{
if (len < bom_len)
return NULL;
if (memcmp (bom, data, bom_len) != 0)
return NULL;
data += bom_len;
len -= bom_len;
enc = enc_no_bom;
}
else if (encoding_allows_bom (enc, &bom, &bom_len))
{
if (len >= bom_len && memcmp (bom, data, bom_len) == 0)
{
data += bom_len;
len -= bom_len;
}
}
if (!g_ascii_strcasecmp (enc, "UTF-8"))
return try_convert_to_utf8_from_utf8 (data, len);
result = g_convert (data, len, "UTF-8", enc, &bytes_read, &bytes_written, NULL);
if (!result)
return NULL;
if (bytes_read < len)
{
g_free (result);
return NULL;
}
result_len = strlen (result);
// ignore trailing zero
if (bytes_written == result_len + 1)
bytes_written -= 1;
if (result_len < bytes_written)
{
g_free (result);
return NULL;
}
return result;
}
static char *
try_convert_to_utf8_from_encoding (const char *data,
gsize len,
const char *enc)
{
if (!g_ascii_strcasecmp (enc, "UTF-8"))
return try_convert_to_utf8_from_utf8 (data, len);
else
return try_convert_to_utf8_from_non_utf8_encoding (data, len, enc);
}
static char *
moo_convert_file_data_to_utf8 (const char *data,
gsize len,
const char *encoding,
const char *cached_encoding,
char **used_enc)
{
char *freeme = NULL;
char *result = NULL;
const char *bom_enc = NULL;
// g_print ("moo_convert_file_data_to_utf8(%s, %s)\n",
// encoding ? encoding : "<null>",
// cached_encoding ? cached_encoding : "<null>");
*used_enc = NULL;
if (!encoding && data_has_bom (data, len, &bom_enc))
{
encoding = bom_enc;
result = try_convert_to_utf8_from_encoding (data, len, encoding);
}
else if (!encoding)
{
GSList *encodings;
encodings = get_encodings ();
if (cached_encoding)
encodings = g_slist_prepend (encodings, g_strdup (cached_encoding));
while (encodings)
{
char *enc;
enc = (char*) encodings->data;
encodings = g_slist_delete_link (encodings, encodings);
result = try_convert_to_utf8_from_encoding (data, len, enc);
if (result != NULL)
{
encoding = freeme = enc;
break;
}
g_free (enc);
}
g_slist_foreach (encodings, (GFunc) g_free, NULL);
g_slist_free (encodings);
}
else
{
result = try_convert_to_utf8_from_encoding (data, len, encoding);
}
if (result)
*used_enc = g_strdup (encoding);
g_free (freeme);
return result;
}

View File

@ -70,9 +70,15 @@ static const struct {
{ "UTF-7", N_("Unicode"), "UTF-7", ENCODING_GROUP_UNICODE }, { "UTF-7", N_("Unicode"), "UTF-7", ENCODING_GROUP_UNICODE },
{ "UTF-8", N_("Unicode"), "UTF-8", ENCODING_GROUP_UNICODE }, { "UTF-8", N_("Unicode"), "UTF-8", ENCODING_GROUP_UNICODE },
{ "UTF-8-BOM", N_("Unicode"), "UTF-8 with BOM", ENCODING_GROUP_UNICODE },
{ "UTF-16", N_("Unicode"), "UTF-16", ENCODING_GROUP_UNICODE }, { "UTF-16", N_("Unicode"), "UTF-16", ENCODING_GROUP_UNICODE },
{ "UCS-2", N_("Unicode"), "UCS-2", ENCODING_GROUP_UNICODE }, { "UTF-16BE", N_("Unicode"), "UTF-16BE", ENCODING_GROUP_UNICODE },
{ "UCS-4", N_("Unicode"), "UCS-4", ENCODING_GROUP_UNICODE }, { "UTF-16-BOM", N_("Unicode"), "UTF-16 with BOM", ENCODING_GROUP_UNICODE },
{ "UTF-16BE-BOM", N_("Unicode"), "UTF-16BE with BOM",ENCODING_GROUP_UNICODE },
{ "UTF-32", N_("Unicode"), "UTF-32", ENCODING_GROUP_UNICODE },
{ "UTF-32BE", N_("Unicode"), "UTF-32BE", ENCODING_GROUP_UNICODE },
{ "UTF-32-BOM", N_("Unicode"), "UTF-32 with BOM", ENCODING_GROUP_UNICODE },
{ "UTF-32BE-BOM", N_("Unicode"), "UTF-32BE with BOM",ENCODING_GROUP_UNICODE },
{ "ARMSCII-8", N_("Armenian"), "ARMSCII-8", ENCODING_GROUP_SE_SW_ASIAN }, { "ARMSCII-8", N_("Armenian"), "ARMSCII-8", ENCODING_GROUP_SE_SW_ASIAN },
{ "BIG5", N_("Chinese Traditional"), "Big5", ENCODING_GROUP_EAST_ASIAN }, { "BIG5", N_("Chinese Traditional"), "Big5", ENCODING_GROUP_EAST_ASIAN },

View File

@ -21,8 +21,20 @@
G_BEGIN_DECLS G_BEGIN_DECLS
#define MOO_ENCODING_AUTO "auto" #define MOO_ENCODING_AUTO "auto"
#define MOO_ENCODING_UTF8 "UTF-8" #define MOO_ENCODING_UTF8 "UTF-8"
#define MOO_ENCODING_UTF16 "UTF-16"
#define MOO_ENCODING_UTF16LE "UTF-16LE"
#define MOO_ENCODING_UTF16BE "UTF-16BE"
#define MOO_ENCODING_UTF16LE_BOM "UTF-16LE-BOM"
#define MOO_ENCODING_UTF16BE_BOM "UTF-16BE-BOM"
#define MOO_ENCODING_UTF32 "UTF-32"
#define MOO_ENCODING_UTF32LE "UTF-32LE"
#define MOO_ENCODING_UTF32BE "UTF-32BE"
#define MOO_ENCODING_UTF32LE_BOM "UTF-32LE-BOM"
#define MOO_ENCODING_UTF32BE_BOM "UTF-32BE-BOM"
typedef enum { typedef enum {
MOO_ENCODING_COMBO_OPEN, MOO_ENCODING_COMBO_OPEN,