]> git.ipfire.org Git - thirdparty/git.git/blame - gettext.c
utf8: fix overflow when returning string width
[thirdparty/git.git] / gettext.c
CommitLineData
30955229
JN
1/*
2 * Copyright (c) 2010 Ævar Arnfjörð Bjarmason
3 */
4
226c0ddd 5#include "cache.h"
92034a9c 6#include "exec-cmd.h"
30955229 7#include "gettext.h"
754395d3
NTND
8#include "strbuf.h"
9#include "utf8.h"
6cdccfce 10#include "config.h"
30955229 11
5e9637c6
ÆAB
12#ifndef NO_GETTEXT
13# include <locale.h>
14# include <libintl.h>
090d1e84
KB
15# ifdef GIT_WINDOWS_NATIVE
16
17static const char *locale_charset(void)
18{
19 const char *env = getenv("LC_ALL"), *dot;
20
21 if (!env || !*env)
22 env = getenv("LC_CTYPE");
23 if (!env || !*env)
24 env = getenv("LANG");
25
26 if (!env)
27 return "UTF-8";
28
29 dot = strchr(env, '.');
30 return !dot ? env : dot + 1;
31}
32
33# elif defined HAVE_LIBCHARSET_H
5e9637c6
ÆAB
34# include <libcharset.h>
35# else
36# include <langinfo.h>
37# define locale_charset() nl_langinfo(CODESET)
38# endif
39#endif
40
e8c16726
NTND
41static const char *charset;
42
93f7d910
JK
43/*
44 * Guess the user's preferred languages from the value in LANGUAGE environment
45 * variable and LC_MESSAGES locale category if NO_GETTEXT is not defined.
46 *
47 * The result can be a colon-separated list like "ko:ja:en".
48 */
49const char *get_preferred_languages(void)
50{
51 const char *retval;
52
53 retval = getenv("LANGUAGE");
54 if (retval && *retval)
55 return retval;
56
57#ifndef NO_GETTEXT
58 retval = setlocale(LC_MESSAGES, NULL);
59 if (retval && *retval &&
60 strcmp(retval, "C") &&
61 strcmp(retval, "POSIX"))
62 return retval;
63#endif
64
65 return NULL;
66}
67
30955229
JN
68int use_gettext_poison(void)
69{
70 static int poison_requested = -1;
1ff750b1
ÆAB
71 if (poison_requested == -1)
72 poison_requested = git_env_bool("GIT_TEST_GETTEXT_POISON", 0);
30955229
JN
73 return poison_requested;
74}
5e9637c6
ÆAB
75
76#ifndef NO_GETTEXT
9c0495d2
NTND
77static int test_vsnprintf(const char *fmt, ...)
78{
79 char buf[26];
80 int ret;
81 va_list ap;
82 va_start(ap, fmt);
83 ret = vsnprintf(buf, sizeof(buf), fmt, ap);
84 va_end(ap);
85 return ret;
86}
87
5e9637c6
ÆAB
88static void init_gettext_charset(const char *domain)
89{
5e9637c6
ÆAB
90 setlocale(LC_CTYPE, "");
91 charset = locale_charset();
92 bind_textdomain_codeset(domain, charset);
9371c0e9
ÆAB
93
94 /*
95 * Work around an old bug fixed in glibc 2.17 (released on
96 * 2012-12-24), at the cost of potentially making translated
97 * messages from external functions like perror() emitted in
98 * the wrong encoding.
99 *
100 * The bug affected e.g. git.git's own 7eb93c89651 ([PATCH]
101 * Simplify git script, 2005-09-07), which is the origin of
102 * the "David_K\345gedal" test string.
103 *
104 * See a much longer comment added to this file in 5e9637c6297
105 * (i18n: add infrastructure for translating Git with gettext,
106 * 2011-11-18) for more details.
107 */
9c0495d2
NTND
108 if (test_vsnprintf("%.*s", 13, "David_K\345gedal") < 0)
109 setlocale(LC_CTYPE, "C");
5e9637c6
ÆAB
110}
111
112void git_setup_gettext(void)
113{
226c0ddd 114 const char *podir = getenv(GIT_TEXT_DOMAIN_DIR_ENVIRONMENT);
0210231b 115 char *p = NULL;
5e9637c6
ÆAB
116
117 if (!podir)
0210231b 118 podir = p = system_path(GIT_LOCALE_PATH);
226c0ddd 119
6cdccfce
ÆAB
120 use_gettext_poison(); /* getenv() reentrancy paranoia */
121
0210231b
JS
122 if (!is_directory(podir)) {
123 free(p);
cc5e1bf9 124 return;
0210231b 125 }
226c0ddd 126
5e9637c6
ÆAB
127 bindtextdomain("git", podir);
128 setlocale(LC_MESSAGES, "");
aa1462cc 129 setlocale(LC_TIME, "");
5e9637c6
ÆAB
130 init_gettext_charset("git");
131 textdomain("git");
0210231b
JS
132
133 free(p);
5e9637c6 134}
754395d3
NTND
135
136/* return the number of columns of string 's' in current locale */
137int gettext_width(const char *s)
138{
139 static int is_utf8 = -1;
140 if (is_utf8 == -1)
e8c16726 141 is_utf8 = is_utf8_locale();
754395d3
NTND
142
143 return is_utf8 ? utf8_strwidth(s) : strlen(s);
144}
5e9637c6 145#endif
e8c16726
NTND
146
147int is_utf8_locale(void)
148{
149#ifdef NO_GETTEXT
150 if (!charset) {
151 const char *env = getenv("LC_ALL");
152 if (!env || !*env)
153 env = getenv("LC_CTYPE");
154 if (!env || !*env)
155 env = getenv("LANG");
156 if (!env)
157 env = "";
158 if (strchr(env, '.'))
159 env = strchr(env, '.') + 1;
160 charset = xstrdup(env);
161 }
162#endif
163 return is_encoding_utf8(charset);
164}