mirror of
https://gitlab.freedesktop.org/gstreamer/gstreamer.git
synced 2024-11-26 11:41:09 +00:00
tag: add mklicensestables utility
Add (uninstalled) tool to create licenses-table.dat from liblicense's RDF files. It's not very pretty and makes loats of assumptions about the input, but should work. If things change, we can fix it then. https://bugzilla.gnome.org/show_bug.cgi?id=646868
This commit is contained in:
parent
c4bab487e7
commit
25f8f6453e
3 changed files with 905 additions and 3 deletions
5
.gitignore
vendored
5
.gitignore
vendored
|
@ -43,8 +43,9 @@ Makefile
|
|||
*.gir
|
||||
*.typelib
|
||||
|
||||
gst-libs/gst/pbutils/gstpluginsbaseversion.h
|
||||
gst-libs/gst/tag/mklangtables
|
||||
/gst-libs/gst/pbutils/gstpluginsbaseversion.h
|
||||
/gst-libs/gst/tag/mklangtables
|
||||
/gst-libs/gst/tag/mklicensestables
|
||||
|
||||
tmp-orc.c
|
||||
gst*orc.h
|
||||
|
|
|
@ -84,7 +84,18 @@ else
|
|||
ISO_CODE_PROGS =
|
||||
endif
|
||||
|
||||
noinst_PROGRAMS = $(ISO_CODE_PROGS)
|
||||
LICENSE_PROGS = mklicensestables
|
||||
mklicensestables_SOURCES = mklicensestables.c
|
||||
mklicensestables_CFLAGS = $(GST_CFLAGS)
|
||||
mklicensestables_LDADD = $(GST_LIBS)
|
||||
|
||||
noinst_PROGRAMS = $(ISO_CODE_PROGS) $(LICENSE_PROGS)
|
||||
|
||||
update-licenses: mklicensestables
|
||||
$(builddir)/mklicensestables \
|
||||
--translation-dictionary=$(builddir)/license-translations.dict \
|
||||
> $(builddir)/licenses-tables.dat && \
|
||||
echo "Updated licenses-tables.dat and license-translations.dict"
|
||||
|
||||
#if USE_NLS
|
||||
# Yes, this is not great, but it's only an implementation detail. The
|
||||
|
|
890
gst-libs/gst/tag/mklicensestables.c
Normal file
890
gst-libs/gst/tag/mklicensestables.c
Normal file
|
@ -0,0 +1,890 @@
|
|||
/* GStreamer License Utility Functions
|
||||
* Copyright (C) 2011 Tim-Philipp Müller <tim centricular net>
|
||||
*
|
||||
* This library is free software; you can redistribute it and/or
|
||||
* modify it under the terms of the GNU Library General Public
|
||||
* License as published by the Free Software Foundation; either
|
||||
* version 2 of the License, or (at your option) any later version.
|
||||
*
|
||||
* This library is distributed in the hope that it will be useful,
|
||||
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
||||
* Library General Public License for more details.
|
||||
*
|
||||
* You should have received a copy of the GNU Library General Public
|
||||
* License along with this library; if not, write to the
|
||||
* Free Software Foundation, Inc., 59 Temple Place - Suite 330,
|
||||
* Boston, MA 02111-1307, USA.
|
||||
*/
|
||||
|
||||
/* mklicensestables.c:
|
||||
* little program that reads liblicense's license RDF files and outputs tables
|
||||
* with the most important information, so we don't have to parse megabytes
|
||||
* of mostly redundant RDF files to get some basic information (and vendors
|
||||
* don't have to ship it all).
|
||||
*/
|
||||
|
||||
#ifdef HAVE_CONFIG_H
|
||||
#include "config.h"
|
||||
#endif
|
||||
|
||||
#include "tag.h"
|
||||
|
||||
#include <string.h>
|
||||
#include <stdlib.h>
|
||||
#include <stdio.h>
|
||||
|
||||
/* TODO: we can merge some of the jurisdiction-only license table entries
|
||||
* into one entry with multiple jurisdictions and without the 'generic' flag,
|
||||
* .e.g. by-nc-nd/2.5/es + by-nc-nd/2.5/au => by-nc-nd/2.5/{es,au} */
|
||||
|
||||
#define LIBLICENSE_DATA_PREFIX "/usr/share/liblicense/licenses"
|
||||
|
||||
static GHashTable *unknown_sources; /* NULL */
|
||||
|
||||
static GList *licenses; /* NULL */
|
||||
|
||||
/* list of languages used for translations */
|
||||
static GList *langs; /* NULL */
|
||||
|
||||
/* keep in sync with licenses.c */
|
||||
static const gchar jurisdictions[] =
|
||||
"ar\000at\000au\000be\000bg\000br\000ca\000ch\000cl\000cn\000co\000de\000"
|
||||
"dk\000es\000fi\000fr\000hr\000hu\000il\000in\000it\000jp\000kr\000mk\000"
|
||||
"mt\000mx\000my\000nl\000pe\000pl\000pt\000scotland\000se\000si\000tw\000"
|
||||
"uk\000us\000za";
|
||||
|
||||
/* keep in sync with gst_tag_get_license_version() */
|
||||
static const gchar known_versions[] = "1.0/2.0/2.1/2.5/3.0/";
|
||||
|
||||
/* is this license 'generic' (and a base for any of the supported
|
||||
* jurisdictions), or jurisdiction-specific only? */
|
||||
#define JURISDICTION_GENERIC (G_GUINT64_CONSTANT (1) << 63)
|
||||
|
||||
typedef struct
|
||||
{
|
||||
gchar *ref;
|
||||
guint64 jurisdiction;
|
||||
gchar *jurisdiction_suffix; /* if not generic (e.g. "jp/") */
|
||||
gchar *legalcode;
|
||||
gchar *version;
|
||||
gchar *replaced_by;
|
||||
gchar *source;
|
||||
|
||||
GstTagLicenseFlags flags;
|
||||
|
||||
gboolean deprecated;
|
||||
|
||||
GHashTable *titles;
|
||||
GHashTable *descriptions;
|
||||
|
||||
/* for processing */
|
||||
const gchar *cur_lang;
|
||||
gboolean packed_into_source;
|
||||
|
||||
/* list of licenses packed into this one (ie. this is the source of those) */
|
||||
GList *derived;
|
||||
} License;
|
||||
|
||||
static GstTagLicenseFlags
|
||||
ref_to_flag (const gchar * ref)
|
||||
{
|
||||
if (strcmp (ref, "http://creativecommons.org/ns#Reproduction") == 0)
|
||||
return GST_TAG_LICENSE_PERMITS_REPRODUCTION;
|
||||
if (strcmp (ref, "http://creativecommons.org/ns#Distribution") == 0)
|
||||
return GST_TAG_LICENSE_PERMITS_DISTRIBUTION;
|
||||
if (strcmp (ref, "http://creativecommons.org/ns#DerivativeWorks") == 0)
|
||||
return GST_TAG_LICENSE_PERMITS_DERIVATIVE_WORKS;
|
||||
if (strcmp (ref, "http://creativecommons.org/ns#Sharing") == 0)
|
||||
return GST_TAG_LICENSE_PERMITS_SHARING;
|
||||
if (strcmp (ref, "http://creativecommons.org/ns#Notice") == 0)
|
||||
return GST_TAG_LICENSE_REQUIRES_NOTICE;
|
||||
if (strcmp (ref, "http://creativecommons.org/ns#Attribution") == 0)
|
||||
return GST_TAG_LICENSE_REQUIRES_ATTRIBUTION;
|
||||
if (strcmp (ref, "http://creativecommons.org/ns#ShareAlike") == 0)
|
||||
return GST_TAG_LICENSE_REQUIRES_SHARE_ALIKE;
|
||||
if (strcmp (ref, "http://creativecommons.org/ns#SourceCode") == 0)
|
||||
return GST_TAG_LICENSE_REQUIRES_SOURCE_CODE;
|
||||
if (strcmp (ref, "http://creativecommons.org/ns#Copyleft") == 0)
|
||||
return GST_TAG_LICENSE_REQUIRES_COPYLEFT;
|
||||
if (strcmp (ref, "http://creativecommons.org/ns#LesserCopyleft") == 0)
|
||||
return GST_TAG_LICENSE_REQUIRES_LESSER_COPYLEFT;
|
||||
if (strcmp (ref, "http://creativecommons.org/ns#CommercialUse") == 0)
|
||||
return GST_TAG_LICENSE_PROHIBITS_COMMERCIAL_USE;
|
||||
if (strcmp (ref, "http://creativecommons.org/ns#HighIncomeNationUse") == 0)
|
||||
return GST_TAG_LICENSE_PROHIBITS_HIGH_INCOME_NATION_USE;
|
||||
|
||||
g_error ("Unknown permits/requires/prohibits: %s\n", ref);
|
||||
return 0;
|
||||
};
|
||||
|
||||
static guint64
|
||||
ref_to_jurisdiction (const gchar * ref)
|
||||
{
|
||||
const gchar *j = jurisdictions;
|
||||
gchar *jur;
|
||||
guint64 bit = 1;
|
||||
|
||||
jur = g_strdup (ref + strlen ("http://creativecommons.org/international/"));
|
||||
g_strdelimit (jur, "/", '\0');
|
||||
while (j < jurisdictions + sizeof (jurisdictions)) {
|
||||
if (strcmp (j, jur) == 0) {
|
||||
g_free (jur);
|
||||
g_assert (bit != 0 && bit != JURISDICTION_GENERIC);
|
||||
return bit;
|
||||
}
|
||||
j += strlen (j) + 1;
|
||||
bit <<= 1;
|
||||
}
|
||||
g_error ("Unknown jurisdiction '%s'\n", ref);
|
||||
}
|
||||
|
||||
typedef enum
|
||||
{
|
||||
TAG_CC_LICENSE,
|
||||
TAG_CC_JURISDICTION,
|
||||
TAG_CC_LEGALCODE,
|
||||
TAG_CC_PROHIBITS,
|
||||
TAG_CC_REQUIRES,
|
||||
TAG_CC_PERMITS,
|
||||
TAG_CC_DEPRECATED_ON,
|
||||
TAG_DC_CREATOR,
|
||||
TAG_DC_SOURCE,
|
||||
TAG_DC_TITLE,
|
||||
TAG_DC_DESCRIPTION,
|
||||
TAG_DCQ_HAS_VERSION,
|
||||
TAG_DCQ_IS_REPLACED_BY,
|
||||
TAG_RDF_RDF,
|
||||
TAG_RDF_DESCRIPTION,
|
||||
} Tag;
|
||||
|
||||
static const struct
|
||||
{
|
||||
const gchar *element_name;
|
||||
const gchar *attribute;
|
||||
const Tag element_tag;
|
||||
} tag_map[] = {
|
||||
{
|
||||
"cc:License", "rdf:about", TAG_CC_LICENSE}, {
|
||||
"cc:deprecatedOn", "rdf:datatype", TAG_CC_DEPRECATED_ON}, {
|
||||
"cc:jurisdiction", "rdf:resource", TAG_CC_JURISDICTION}, {
|
||||
"cc:legalcode", "rdf:resource", TAG_CC_LEGALCODE}, {
|
||||
"cc:prohibits", "rdf:resource", TAG_CC_PROHIBITS}, {
|
||||
"cc:requires", "rdf:resource", TAG_CC_REQUIRES}, {
|
||||
"cc:permits", "rdf:resource", TAG_CC_PERMITS}, {
|
||||
"dc:creator", "rdf:resource", TAG_DC_CREATOR}, {
|
||||
"dc:source", "rdf:resource", TAG_DC_SOURCE}, {
|
||||
"dc:title", "xml:lang", TAG_DC_TITLE}, {
|
||||
"dc:description", "xml:lang", TAG_DC_DESCRIPTION}, {
|
||||
"dcq:hasVersion", NULL, TAG_DCQ_HAS_VERSION}, {
|
||||
"dcq:isReplacedBy", "rdf:resource", TAG_DCQ_IS_REPLACED_BY}, {
|
||||
"rdf:RDF", NULL, TAG_RDF_RDF}, {
|
||||
"rdf:Description", "rdf:about", TAG_RDF_DESCRIPTION},
|
||||
/* these three are just for by-nc-nd_2.0_jp_.rdf */
|
||||
{
|
||||
"dc:isBasedOn", "rdf:resource", TAG_DC_SOURCE}, {
|
||||
"dc:hasVersion", NULL, TAG_DCQ_HAS_VERSION}, {
|
||||
"dc:isReplacedBy", "rdf:resource", TAG_DCQ_IS_REPLACED_BY}
|
||||
};
|
||||
|
||||
static void
|
||||
parse_start (GMarkupParseContext * ctx, const gchar * element_name,
|
||||
const gchar ** attr_names, const gchar ** attr_vals,
|
||||
gpointer user_data, GError ** err)
|
||||
{
|
||||
License *license = user_data;
|
||||
const gchar *ref = NULL;
|
||||
int i;
|
||||
|
||||
for (i = 0; i < G_N_ELEMENTS (tag_map); ++i) {
|
||||
if (strcmp (element_name, tag_map[i].element_name) == 0)
|
||||
break;
|
||||
}
|
||||
|
||||
if (i == G_N_ELEMENTS (tag_map))
|
||||
g_error ("Unexpected tag '%s'\n", element_name);
|
||||
|
||||
if (tag_map[i].attribute == NULL)
|
||||
return;
|
||||
|
||||
if (!g_markup_collect_attributes (element_name, attr_names, attr_vals,
|
||||
err, G_MARKUP_COLLECT_STRING, tag_map[i].attribute, &ref,
|
||||
G_MARKUP_COLLECT_INVALID)) {
|
||||
return;
|
||||
}
|
||||
|
||||
switch (tag_map[i].element_tag) {
|
||||
case TAG_CC_LICENSE:
|
||||
if (!g_str_has_prefix (ref, "http://creativecommons.org/licenses/"))
|
||||
g_error ("Unexpected license reference: %s\n", ref);
|
||||
/* we assume one license per file, and CC license ref */
|
||||
g_assert (license->ref == NULL);
|
||||
license->ref = g_strdup (ref);
|
||||
break;
|
||||
case TAG_CC_JURISDICTION:
|
||||
if (!g_str_has_prefix (ref, "http://creativecommons.org/international/"))
|
||||
g_error ("Unknown license jurisdiction: %s\n", ref);
|
||||
/* we assume one jurisdiction per license */
|
||||
g_assert (license->jurisdiction == JURISDICTION_GENERIC);
|
||||
license->jurisdiction = ref_to_jurisdiction (ref);
|
||||
license->jurisdiction_suffix =
|
||||
g_strdup (ref + strlen ("http://creativecommons.org/international/"));
|
||||
break;
|
||||
case TAG_CC_LEGALCODE:
|
||||
if (!g_str_has_prefix (ref, "http://creativecommons.org/licenses/"))
|
||||
g_error ("Unexpected legalcode reference: %s\n", ref);
|
||||
/* we assume one legalcode per license */
|
||||
g_assert (license->legalcode == NULL);
|
||||
license->legalcode = g_strdup (ref);
|
||||
break;
|
||||
case TAG_DC_CREATOR:
|
||||
if (strcmp (ref, "http://creativecommons.org") == 0) {
|
||||
license->flags |= GST_TAG_LICENSE_CREATIVE_COMMONS_LICENSE;
|
||||
} else if (strcmp (ref, "http://fsf.org") == 0) {
|
||||
license->flags |= GST_TAG_LICENSE_FREE_SOFTWARE_FOUNDATION_LICENSE;
|
||||
} else {
|
||||
g_error ("Unknown license creator: %s\n", ref);
|
||||
}
|
||||
break;
|
||||
case TAG_CC_DEPRECATED_ON:
|
||||
break;
|
||||
case TAG_CC_PROHIBITS:
|
||||
case TAG_CC_REQUIRES:
|
||||
case TAG_CC_PERMITS:
|
||||
license->flags |= ref_to_flag (ref);
|
||||
break;
|
||||
case TAG_DC_TITLE:{
|
||||
gchar *cur_lang;
|
||||
|
||||
cur_lang = g_strdelimit (g_strdup (ref), "-", '_');
|
||||
license->cur_lang = g_intern_string (cur_lang);
|
||||
if (!g_list_find_custom (langs, cur_lang, (GCompareFunc) strcmp))
|
||||
langs = g_list_prepend (langs, (gpointer) license->cur_lang);
|
||||
|
||||
g_free (cur_lang);
|
||||
break;
|
||||
}
|
||||
case TAG_DC_DESCRIPTION:{
|
||||
gchar *cur_lang;
|
||||
|
||||
cur_lang = g_strdelimit (g_strdup (ref), "-", '_');
|
||||
license->cur_lang = g_intern_string (cur_lang);
|
||||
if (!g_list_find_custom (langs, cur_lang, (GCompareFunc) strcmp))
|
||||
langs = g_list_prepend (langs, (gpointer) license->cur_lang);
|
||||
|
||||
g_free (cur_lang);
|
||||
break;
|
||||
}
|
||||
case TAG_DCQ_IS_REPLACED_BY:
|
||||
/* we assume one replacer per license for now */
|
||||
g_assert (license->replaced_by == NULL);
|
||||
license->replaced_by = g_strdup (ref);
|
||||
break;
|
||||
case TAG_RDF_DESCRIPTION:
|
||||
if (!g_str_has_prefix (ref, "http://creativecommons.org/licenses/"))
|
||||
g_error ("Unexpected license reference: %s\n", ref);
|
||||
if (license->ref != NULL && strcmp (license->ref, ref) != 0) {
|
||||
gchar *f, *r = g_strdup (ref);
|
||||
|
||||
/* work around bug in some of the RDFs ... */
|
||||
if ((f = strstr (r, "by-nc-nd"))) {
|
||||
memcpy (f, "by-nd-nc", 8);
|
||||
}
|
||||
if (strcmp (license->ref, r) != 0) {
|
||||
g_error ("rdf:Description chunk for other than current license");
|
||||
}
|
||||
g_free (r);
|
||||
}
|
||||
break;
|
||||
case TAG_DC_SOURCE:
|
||||
if (!g_str_has_prefix (ref, "http://creativecommons.org/licenses/"))
|
||||
g_error ("Unexpected source reference: %s\n", ref);
|
||||
/* we assume one source (for jurisdiction-specific versions) */
|
||||
g_assert (license->source == NULL);
|
||||
license->source = g_strdup (ref);
|
||||
break;
|
||||
default:
|
||||
g_printerr ("unhandled start tag: %s\n", element_name);
|
||||
break;
|
||||
}
|
||||
}
|
||||
|
||||
static void
|
||||
parse_text (GMarkupParseContext * ctx, const gchar * text, gsize text_len,
|
||||
gpointer user_data, GError ** err)
|
||||
{
|
||||
License *license = user_data;
|
||||
const gchar *element_name, *found;
|
||||
int i;
|
||||
|
||||
element_name = g_markup_parse_context_get_element (ctx);
|
||||
for (i = 0; i < G_N_ELEMENTS (tag_map); ++i) {
|
||||
if (strcmp (element_name, tag_map[i].element_name) == 0)
|
||||
break;
|
||||
}
|
||||
|
||||
if (i == G_N_ELEMENTS (tag_map))
|
||||
g_error ("Unexpected tag '%s'\n", element_name);
|
||||
|
||||
switch (tag_map[i].element_tag) {
|
||||
case TAG_CC_LICENSE:
|
||||
case TAG_CC_JURISDICTION:
|
||||
case TAG_CC_LEGALCODE:
|
||||
case TAG_DC_CREATOR:
|
||||
case TAG_CC_PROHIBITS:
|
||||
case TAG_CC_REQUIRES:
|
||||
case TAG_CC_PERMITS:
|
||||
case TAG_RDF_RDF:
|
||||
case TAG_RDF_DESCRIPTION:
|
||||
break;
|
||||
case TAG_DC_TITLE:
|
||||
if (license->titles == NULL) {
|
||||
license->titles = g_hash_table_new (g_str_hash, g_str_equal);
|
||||
}
|
||||
g_hash_table_insert (license->titles, (gpointer) license->cur_lang,
|
||||
(gpointer) g_intern_string (text));
|
||||
break;
|
||||
case TAG_DC_DESCRIPTION:{
|
||||
gchar *txt = g_strdup (text);
|
||||
|
||||
if (license->descriptions == NULL) {
|
||||
license->descriptions = g_hash_table_new (g_str_hash, g_str_equal);
|
||||
}
|
||||
g_strdelimit (txt, "\n", ' ');
|
||||
g_hash_table_insert (license->descriptions, (gpointer) license->cur_lang,
|
||||
(gpointer) g_intern_string (txt));
|
||||
g_free (txt);
|
||||
break;
|
||||
}
|
||||
case TAG_DCQ_HAS_VERSION:
|
||||
/* we assume one version per license */
|
||||
g_assert (license->version == NULL);
|
||||
license->version = g_strdup (text);
|
||||
found = strstr (known_versions, license->version);
|
||||
if (found == NULL || found[strlen (license->version)] != '/')
|
||||
g_error ("Unexpected version '%s', please add to table.", text);
|
||||
break;
|
||||
case TAG_CC_DEPRECATED_ON:
|
||||
license->deprecated = TRUE;
|
||||
break;
|
||||
case TAG_DC_SOURCE: // FIXME
|
||||
default:
|
||||
g_print ("text (%s) (%s): '%s'\n", element_name, license->cur_lang, text);
|
||||
}
|
||||
}
|
||||
|
||||
static void
|
||||
parse_passthrough (GMarkupParseContext * ctx, const gchar * text, gsize len,
|
||||
gpointer user_data, GError ** err)
|
||||
{
|
||||
if (!g_str_has_prefix (text, "<?xml ")) {
|
||||
g_error ("Unexpected passthrough text: %s\n", text);
|
||||
}
|
||||
}
|
||||
|
||||
static void
|
||||
parse_error (GMarkupParseContext * ctx, GError * err, gpointer data)
|
||||
{
|
||||
g_error ("parse error: %s\n", err->message);
|
||||
}
|
||||
|
||||
static const GMarkupParser license_rdf_parser = {
|
||||
parse_start, NULL, parse_text, parse_passthrough, parse_error
|
||||
};
|
||||
|
||||
static void
|
||||
parse_license_rdf (const gchar * fn, const gchar * rdf)
|
||||
{
|
||||
GMarkupParseContext *ctx;
|
||||
License *license;
|
||||
GError *err = NULL;
|
||||
|
||||
if (!g_utf8_validate (rdf, -1, NULL)) {
|
||||
g_error ("%s is not valid UTF-8\n", fn);
|
||||
}
|
||||
|
||||
license = g_new0 (License, 1);
|
||||
|
||||
/* mark as generic until proven otherwise */
|
||||
license->jurisdiction = JURISDICTION_GENERIC;
|
||||
|
||||
ctx = g_markup_parse_context_new (&license_rdf_parser,
|
||||
G_MARKUP_TREAT_CDATA_AS_TEXT, license, NULL);
|
||||
|
||||
/* g_print ("Parsing %s\n", fn); */
|
||||
|
||||
if (!g_markup_parse_context_parse (ctx, rdf, -1, &err)) {
|
||||
g_error ("Error parsing file %s: %s\n", fn, err->message);
|
||||
}
|
||||
|
||||
licenses = g_list_append (licenses, license);
|
||||
|
||||
g_markup_parse_context_free (ctx);
|
||||
}
|
||||
|
||||
static void
|
||||
read_licenses (const gchar * licenses_dir)
|
||||
{
|
||||
const gchar *name;
|
||||
GError *err = NULL;
|
||||
GDir *dir;
|
||||
|
||||
dir = g_dir_open (licenses_dir, 0, &err);
|
||||
|
||||
if (dir == NULL)
|
||||
g_error ("Failed to g_dir_open('%s'): %s", licenses_dir, err->message);
|
||||
|
||||
while ((name = g_dir_read_name (dir))) {
|
||||
gchar *fn, *rdf;
|
||||
|
||||
fn = g_build_filename (licenses_dir, name, NULL);
|
||||
if (g_file_get_contents (fn, &rdf, NULL, &err)) {
|
||||
parse_license_rdf (fn, rdf);
|
||||
g_free (rdf);
|
||||
} else {
|
||||
g_printerr ("Could not read file '%s': %s\n", fn, err->message);
|
||||
g_error_free (err);
|
||||
err = NULL;
|
||||
}
|
||||
g_free (fn);
|
||||
}
|
||||
|
||||
g_dir_close (dir);
|
||||
}
|
||||
|
||||
static License *
|
||||
find_license (const gchar * ref)
|
||||
{
|
||||
GList *l;
|
||||
|
||||
if (!g_str_has_prefix (ref, "http://creativecommons.org/"))
|
||||
return NULL;
|
||||
|
||||
for (l = licenses; l != NULL; l = l->next) {
|
||||
License *license = l->data;
|
||||
|
||||
if (strcmp (license->ref, ref) == 0)
|
||||
return license;
|
||||
}
|
||||
|
||||
return NULL;
|
||||
}
|
||||
|
||||
static int
|
||||
license_ref_cmp (License * a, License * b)
|
||||
{
|
||||
return strcmp (a->ref, b->ref);
|
||||
}
|
||||
|
||||
#define STRING_TABLE_MAX_STRINGS 100
|
||||
typedef struct
|
||||
{
|
||||
GString *s;
|
||||
guint num_escaped;
|
||||
guint num_strings;
|
||||
guint indices[STRING_TABLE_MAX_STRINGS];
|
||||
gchar *strings[STRING_TABLE_MAX_STRINGS]; /* unescaped strings */
|
||||
} StringTable;
|
||||
|
||||
static StringTable *
|
||||
string_table_new (void)
|
||||
{
|
||||
StringTable *t = g_new0 (StringTable, 1);
|
||||
|
||||
t->s = g_string_new (NULL);
|
||||
return t;
|
||||
}
|
||||
|
||||
static void
|
||||
string_table_free (StringTable * t)
|
||||
{
|
||||
int i;
|
||||
|
||||
for (i = 0; i < t->num_strings; ++i)
|
||||
g_free (t->strings[i]);
|
||||
|
||||
g_string_free (t->s, TRUE);
|
||||
g_free (t);
|
||||
}
|
||||
|
||||
static guint
|
||||
string_table_add_string (StringTable * t, const gchar * str)
|
||||
{
|
||||
const gchar *s;
|
||||
guint idx, i;
|
||||
|
||||
/* check if we already have this string */
|
||||
for (i = 0; i < t->num_strings; ++i) {
|
||||
if (strcmp (t->strings[i], str) == 0)
|
||||
return t->indices[i];
|
||||
}
|
||||
|
||||
/* save current offset */
|
||||
idx = t->s->len;
|
||||
|
||||
/* adjust for fact that \000 is 4 chars now but will take up only 1 later */
|
||||
idx -= t->num_escaped * 3;
|
||||
|
||||
/* append one char at a time, making sure to escape UTF-8 characters */
|
||||
for (s = str; s != NULL && *s != '\0'; ++s) {
|
||||
if (g_ascii_isprint (*s) && *s != '"' && *s != '\\') {
|
||||
g_string_append_c (t->s, *s);
|
||||
} else {
|
||||
g_string_append_printf (t->s, "\\%03o", (unsigned char) *s);
|
||||
t->num_escaped++;
|
||||
}
|
||||
}
|
||||
g_string_append (t->s, "\\000");
|
||||
t->num_escaped++;
|
||||
|
||||
t->indices[t->num_strings] = idx;
|
||||
t->strings[t->num_strings] = g_strdup (str);
|
||||
++t->num_strings;
|
||||
|
||||
return idx;
|
||||
}
|
||||
|
||||
static void
|
||||
string_table_print (StringTable * t)
|
||||
{
|
||||
const gchar *s;
|
||||
|
||||
s = t->s->str;
|
||||
while (s != NULL && *s != '\0') {
|
||||
gchar line[74], *lastesc;
|
||||
guint left;
|
||||
|
||||
left = strlen (s);
|
||||
g_strlcpy (line, s, MIN (left, sizeof (line)));
|
||||
s += sizeof (line) - 1;
|
||||
/* avoid partial escaped codes at the end of a line */
|
||||
if ((lastesc = strrchr (line, '\\')) && strlen (lastesc) < 4) {
|
||||
s -= strlen (lastesc);
|
||||
*lastesc = '\0';
|
||||
}
|
||||
g_print (" \"%s\"", line);
|
||||
if (left < 74)
|
||||
break;
|
||||
g_print ("\n");
|
||||
}
|
||||
g_print (";\n");
|
||||
}
|
||||
|
||||
/* skip translation if translated string for e.g. "fr_ca" is same as for "fr" */
|
||||
static gboolean
|
||||
skip_translation (GHashTable * ht_strings, const gchar * lang,
|
||||
const gchar * trans)
|
||||
{
|
||||
const gchar *simple_trans;
|
||||
gchar *simple_lang;
|
||||
|
||||
if (strchr (lang, '_') == NULL)
|
||||
return FALSE;
|
||||
|
||||
simple_lang = g_strdup (lang);
|
||||
g_strdelimit (simple_lang, "_", '\0');
|
||||
|
||||
simple_trans = g_hash_table_lookup (ht_strings, (gpointer) simple_lang);
|
||||
g_free (simple_lang);
|
||||
|
||||
return (simple_trans != NULL && strcmp (trans, simple_trans) == 0);
|
||||
}
|
||||
|
||||
static GVariant *
|
||||
create_translation_dict (GHashTable * ht_strings, const gchar * en)
|
||||
{
|
||||
GVariantBuilder array;
|
||||
guint count = 0;
|
||||
GList *l;
|
||||
|
||||
g_variant_builder_init (&array, G_VARIANT_TYPE_ARRAY);
|
||||
|
||||
for (l = langs; l != NULL; l = l->next) {
|
||||
const gchar *trans, *lang;
|
||||
|
||||
lang = (const gchar *) l->data;
|
||||
trans = g_hash_table_lookup (ht_strings, (gpointer) lang);
|
||||
if (trans != NULL && *trans != '\0' && strcmp (en, trans) != 0 &&
|
||||
!skip_translation (ht_strings, lang, trans)) {
|
||||
g_print ("%s (%s) => %s\n", en, lang, trans);
|
||||
g_variant_builder_add_value (&array,
|
||||
g_variant_new_dict_entry (g_variant_new_string (lang),
|
||||
g_variant_new_string (trans)));
|
||||
++count;
|
||||
}
|
||||
}
|
||||
|
||||
if (count == 0) {
|
||||
g_variant_builder_clear (&array);
|
||||
return NULL;
|
||||
}
|
||||
|
||||
return g_variant_builder_end (&array);
|
||||
}
|
||||
|
||||
static void
|
||||
write_translations_dictionary (GList * licenses, const gchar * dict_filename)
|
||||
{
|
||||
/* maps C string => (dictionary of: locale => translation) */
|
||||
GVariantBuilder array;
|
||||
/* maps C string => boolean (if it's in the dictionary already */
|
||||
GHashTable *translations;
|
||||
GVariant *var;
|
||||
GList *l;
|
||||
FILE *f;
|
||||
|
||||
/* sort langs for prettiness / to make variant dumps easier to read */
|
||||
langs = g_list_sort (langs, (GCompareFunc) strcmp);
|
||||
|
||||
g_variant_builder_init (&array, G_VARIANT_TYPE_ARRAY);
|
||||
|
||||
translations = g_hash_table_new (g_str_hash, g_str_equal);
|
||||
|
||||
for (l = licenses; l != NULL; l = l->next) {
|
||||
const gchar *en;
|
||||
License *license;
|
||||
|
||||
license = l->data;
|
||||
|
||||
if (license->packed_into_source)
|
||||
continue;
|
||||
|
||||
/* add title + translations */
|
||||
en = g_hash_table_lookup (license->titles, "en");
|
||||
g_assert (en != NULL);
|
||||
|
||||
/* check if we already have added translations for this string */
|
||||
if (!g_hash_table_lookup (translations, (gpointer) en)) {
|
||||
GVariant *trans;
|
||||
|
||||
trans = create_translation_dict (license->titles, en);
|
||||
if (trans != NULL) {
|
||||
g_variant_builder_add_value (&array,
|
||||
g_variant_new_dict_entry (g_variant_new_string (en), trans));
|
||||
g_hash_table_insert (translations, (gpointer) en,
|
||||
GINT_TO_POINTER (TRUE));
|
||||
}
|
||||
}
|
||||
|
||||
/* add description + translations */
|
||||
if (license->descriptions == NULL)
|
||||
continue;
|
||||
|
||||
en = g_hash_table_lookup (license->descriptions, "en");
|
||||
g_assert (en != NULL);
|
||||
|
||||
/* check if we already have added translations for this string */
|
||||
if (!g_hash_table_lookup (translations, (gpointer) en)) {
|
||||
GVariant *trans;
|
||||
|
||||
trans = create_translation_dict (license->descriptions, en);
|
||||
if (trans != NULL) {
|
||||
g_variant_builder_add_value (&array,
|
||||
g_variant_new_dict_entry (g_variant_new_string (en), trans));
|
||||
g_hash_table_insert (translations, (gpointer) en,
|
||||
GINT_TO_POINTER (TRUE));
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
var = g_variant_builder_end (&array);
|
||||
|
||||
f = fopen (dict_filename, "wb");
|
||||
if (fwrite (g_variant_get_data (var), g_variant_get_size (var), 1, f) != 1) {
|
||||
g_error ("failed to write dict to file: %s", g_strerror (errno));
|
||||
}
|
||||
fclose (f);
|
||||
|
||||
g_printerr ("Wrote dictionary to %s, size: %u, type: %s\n", dict_filename,
|
||||
(guint) g_variant_get_size (var), (gchar *) g_variant_get_type (var));
|
||||
|
||||
g_variant_unref (var);
|
||||
g_hash_table_destroy (translations);
|
||||
}
|
||||
|
||||
int
|
||||
main (int argc, char **argv)
|
||||
{
|
||||
gchar *translation_dict_fn = NULL;
|
||||
GOptionContext *ctx;
|
||||
GOptionEntry options[] = {
|
||||
{"translation-dictionary", 0, 0, G_OPTION_ARG_FILENAME,
|
||||
&translation_dict_fn, "Filename of translations dictionary to write",
|
||||
NULL},
|
||||
{NULL}
|
||||
};
|
||||
StringTable *string_table;
|
||||
GError *err = NULL;
|
||||
GList *l;
|
||||
int idx = 0;
|
||||
|
||||
g_type_init ();
|
||||
|
||||
ctx = g_option_context_new ("");
|
||||
g_option_context_add_main_entries (ctx, options, NULL);
|
||||
if (!g_option_context_parse (ctx, &argc, &argv, &err)) {
|
||||
g_printerr ("Error initializing: %s\n", err->message);
|
||||
exit (1);
|
||||
}
|
||||
g_option_context_free (ctx);
|
||||
|
||||
read_licenses (LIBLICENSE_DATA_PREFIX);
|
||||
|
||||
g_printerr ("%d licenses\n", g_list_length (licenses));
|
||||
|
||||
unknown_sources = g_hash_table_new (g_str_hash, g_str_equal);
|
||||
|
||||
for (l = licenses; l != NULL; l = l->next) {
|
||||
License *license = l->data;
|
||||
|
||||
/* if the license has as source, check if we can 'pack' it into the
|
||||
* original license as a jurisdiction-specific variant */
|
||||
if (license->source != NULL) {
|
||||
License *source = find_license (license->source);
|
||||
|
||||
if (source != NULL) {
|
||||
if (source->flags != license->flags) {
|
||||
g_printerr ("Source and derived license have different flags:\n"
|
||||
"\t0x%08x : %s\n\t0x%08x : %s\n", source->flags, source->ref,
|
||||
license->flags, license->ref);
|
||||
source = NULL;
|
||||
} else {
|
||||
if (source->descriptions == NULL) {
|
||||
/* neither should the derived one then */
|
||||
g_assert (license->descriptions == NULL);
|
||||
} else {
|
||||
/* make sure we're not settling for fewer descriptions than
|
||||
* there are */
|
||||
g_assert (g_hash_table_size (license->titles) <=
|
||||
g_hash_table_size (source->titles));
|
||||
g_assert (g_hash_table_size (license->descriptions) <=
|
||||
g_hash_table_size (source->descriptions));
|
||||
}
|
||||
}
|
||||
} else {
|
||||
/* a source is referenced that we haven't encountered
|
||||
* (possibly a referencing bug? seems to happen e.g. when there's a
|
||||
* 2.1 version of a jurisdiction license and it refers to a 2.1
|
||||
* source version, but there's only a 2.0 or 2.5 source version. So
|
||||
* maybe it's supposed to refer to the 2.0 source then, who knows) */
|
||||
if (!g_hash_table_lookup (unknown_sources, license->source)) {
|
||||
g_printerr ("Unknown source license %s\n", license->source);
|
||||
g_hash_table_insert (unknown_sources, g_strdup (license->source),
|
||||
GUINT_TO_POINTER (TRUE));
|
||||
}
|
||||
/* g_print ("Unknown source license %s referenced from %s\n",
|
||||
* license->source, license->ref); */
|
||||
}
|
||||
|
||||
/* should we pack this into the source or not */
|
||||
if (source != NULL) {
|
||||
source->jurisdiction |= license->jurisdiction;
|
||||
source->derived = g_list_insert_sorted (source->derived, license,
|
||||
(GCompareFunc) license_ref_cmp);
|
||||
license->packed_into_source = TRUE;
|
||||
}
|
||||
} else {
|
||||
/* no source license */
|
||||
if (license->titles == NULL)
|
||||
g_error ("License has no titles: %s\n", license->ref);
|
||||
if (license->descriptions == NULL);
|
||||
g_printerr ("License %s has no descriptions!\n", license->ref);
|
||||
}
|
||||
}
|
||||
|
||||
licenses = g_list_sort (licenses, (GCompareFunc) license_ref_cmp);
|
||||
|
||||
string_table = string_table_new ();
|
||||
|
||||
g_print ("/* created by mklicensestables.c */\n");
|
||||
g_print ("static const struct {\n"
|
||||
" /* jurisdictions in addition to the generic version, bitfield */\n"
|
||||
" const guint64 jurisdictions;\n"
|
||||
" const GstTagLicenseFlags flags;\n"
|
||||
" /* the bit after http://creativecommons.org/licenses/ */\n"
|
||||
" const gchar ref[18];\n"
|
||||
" gint16 title_idx; /* index in string table */\n"
|
||||
" gint16 desc_idx; /* index in string table */\n"
|
||||
"} licenses[] = {\n");
|
||||
|
||||
for (l = licenses; l != NULL; l = l->next) {
|
||||
const gchar *title_en, *desc_en;
|
||||
int idx_title, idx_desc;
|
||||
License *license;
|
||||
|
||||
license = l->data;
|
||||
|
||||
if (license->packed_into_source)
|
||||
continue;
|
||||
|
||||
title_en = g_hash_table_lookup (license->titles, "en");
|
||||
g_assert (title_en != NULL);
|
||||
idx_title = string_table_add_string (string_table, title_en);
|
||||
g_assert (idx_title <= G_MAXINT16);
|
||||
|
||||
if (license->descriptions != NULL) {
|
||||
desc_en = g_hash_table_lookup (license->descriptions, "en");
|
||||
g_assert (desc_en != NULL);
|
||||
idx_desc = string_table_add_string (string_table, desc_en);
|
||||
g_assert (idx_desc <= G_MAXINT16);
|
||||
} else {
|
||||
idx_desc = -1;
|
||||
}
|
||||
|
||||
/* output comments with license refs covered by the next stanza */
|
||||
if (license->derived != NULL) {
|
||||
GList *d;
|
||||
|
||||
g_print (" /* %2d %s\n", idx, license->ref);
|
||||
|
||||
for (d = license->derived; d != NULL; d = d->next) {
|
||||
License *derived_license = d->data;
|
||||
|
||||
g_print (" * %2d %s%s\n", idx, derived_license->ref,
|
||||
(d->next == NULL) ? " */" : "");
|
||||
}
|
||||
} else {
|
||||
g_print (" /* %2d %s */\n", idx, license->ref);
|
||||
}
|
||||
/* output essential data */
|
||||
{
|
||||
gchar *ref;
|
||||
|
||||
ref =
|
||||
g_strdup (license->ref +
|
||||
strlen ("http://creativecommons.org/licenses/"));
|
||||
|
||||
/* remove jurisdiction suffix from ref if this is non-generic, since
|
||||
* the suffix is already contained in the jurisdiction flags */
|
||||
if (license->jurisdiction_suffix != NULL) {
|
||||
gsize suffix_len = strlen (license->jurisdiction_suffix);
|
||||
gchar *cutoff;
|
||||
|
||||
cutoff = ref + strlen (ref) - suffix_len;
|
||||
g_assert (!strncmp (cutoff, license->jurisdiction_suffix, suffix_len));
|
||||
g_assert (cutoff[suffix_len - 1] == '/');
|
||||
g_assert (cutoff[suffix_len] == '\0');
|
||||
*cutoff = '\0';
|
||||
}
|
||||
|
||||
g_print (" { 0x%016" G_GINT64_MODIFIER "x, 0x%08x, \"%s\", %d, %d }%s\n",
|
||||
license->jurisdiction, license->flags, ref, idx_title, idx_desc,
|
||||
(l->next != NULL) ? "," : "");
|
||||
|
||||
g_free (ref);
|
||||
}
|
||||
++idx;
|
||||
}
|
||||
g_print ("};\n");
|
||||
|
||||
g_print ("\nstatic const gchar license_strings[] =\n");
|
||||
string_table_print (string_table);
|
||||
string_table_free (string_table);
|
||||
string_table = NULL;
|
||||
|
||||
if (translation_dict_fn != NULL) {
|
||||
write_translations_dictionary (licenses, translation_dict_fn);
|
||||
}
|
||||
|
||||
return 0;
|
||||
}
|
Loading…
Reference in a new issue