/* convert-emoji.c: A tool to create an Emoji data GVariant * Copyright 2017, Red Hat, Inc. * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Lesser General Public * License as published by the Free Software Foundation; either * version 2 of the License, or (at your option) any later version. * * This library is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Lesser General Public License for more details. * * You should have received a copy of the GNU Lesser General Public * License along with this library. If not, see . */ /* Build with gcc -o convert-emoji convert-emoji.c `pkg-config --cflags --libs json-glib-1.0` */ /* Reads data from the json files in emojibase, expecting * language-specific data.raw.json as input */ /* The format of the generated data is: a(ausasu). * Each member of the array has the following fields: * au - sequence of unicode codepoints. If the * sequence contains a 0, it marks the point * where skin tone modifiers should be inserted * s - name, e.g. "man worker" * as - keywords, e.g. "man", "worker" * u - the group that this item belongs to: * 0: smileys-emotion * 1: people-body * 2: component * 3: animals-nature * 4: food-drink * 5: travel-places * 6: activities * 7: objects * 8: symbols * 9: flags */ #include #include gboolean parse_code (GVariantBuilder *b, const char *code) { g_auto(GStrv) strv = NULL; int j; strv = g_strsplit (code, "-", -1); for (j = 0; strv[j]; j++) { guint32 u; char *end; u = (guint32) g_ascii_strtoull (strv[j], &end, 16); if (*end != '\0') { g_error ("failed to parse code: %s\n", strv[j]); return FALSE; } if (0x1f3fb <= u && u <= 0x1f3ff) g_variant_builder_add (b, "u", 0); else g_variant_builder_add (b, "u", u); } return TRUE; } int main (int argc, char *argv[]) { JsonParser *parser; JsonNode *root; JsonObject *ro; JsonArray *array; JsonNode *node; const char *unicode; JsonObjectIter iter; GError *error = NULL; guint length, i; GVariantBuilder builder; GVariant *v; GString *s; GHashTable *names; GString *name_key; if (argc != 3) { g_print ("Usage: emoji-convert INPUT OUTPUT\n"); return 1; } parser = json_parser_new (); if (!json_parser_load_from_file (parser, argv[1], &error)) { g_error ("%s", error->message); return 1; } root = json_parser_get_root (parser); array = json_node_get_array (root); length = json_array_get_length (array); g_variant_builder_init (&builder, G_VARIANT_TYPE ("a(ausasu)")); for (i = 0; i < length; i++) { JsonObject *obj = json_array_get_object_element (array, i); GVariantBuilder b1; GVariantBuilder b2; guint group; const char *name; char *code; if (!json_object_has_member (obj, "group")) continue; group = json_object_get_int_member (obj, "group"); name = json_object_get_string_member (obj, "label"); if (json_object_has_member (obj, "skins")) { JsonArray *a2 = json_object_get_array_member (obj, "skins"); JsonNode *n2 = json_array_get_element (a2, 0); JsonObject *o2 = json_node_get_object (n2); code = g_strdup (json_object_get_string_member (o2, "hexcode")); } else { code = g_strdup (json_object_get_string_member (obj, "hexcode")); } g_variant_builder_init (&b1, G_VARIANT_TYPE ("au")); if (!parse_code (&b1, code)) return 1; g_variant_builder_init (&b2, G_VARIANT_TYPE ("as")); if (json_object_has_member (obj, "tags")) { JsonArray *tags = json_object_get_array_member (obj, "tags"); for (int j = 0; j < json_array_get_length (tags); j++) g_variant_builder_add (&b2, "s", json_array_get_string_element (tags, j)); } g_variant_builder_add (&builder, "(ausasu)", &b1, name, &b2, group); } v = g_variant_builder_end (&builder); if (g_str_has_suffix (argv[2], ".json")) { JsonNode *node; char *out; node = json_gvariant_serialize (v); out = json_to_string (node, TRUE); if (!g_file_set_contents (argv[2], out, -1, &error)) { g_error ("%s", error->message); return 1; } } else { GBytes *bytes; bytes = g_variant_get_data_as_bytes (v); if (!g_file_set_contents (argv[2], g_bytes_get_data (bytes, NULL), g_bytes_get_size (bytes), &error)) { g_error ("%s", error->message); return 1; } } return 0; }