1 /*
   2  * Copyright (c) 1998, 2018, Oracle and/or its affiliates. All rights reserved.
   3  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
   4  *
   5  * This code is free software; you can redistribute it and/or modify it
   6  * under the terms of the GNU General Public License version 2 only, as
   7  * published by the Free Software Foundation.  Oracle designates this
   8  * particular file as subject to the "Classpath" exception as provided
   9  * by Oracle in the LICENSE file that accompanied this code.
  10  *
  11  * This code is distributed in the hope that it will be useful, but WITHOUT
  12  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  13  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  14  * version 2 for more details (a copy is included in the LICENSE file that
  15  * accompanied this code).
  16  *
  17  * You should have received a copy of the GNU General Public License version
  18  * 2 along with this work; if not, write to the Free Software Foundation,
  19  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  20  *
  21  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  22  * or visit www.oracle.com if you need additional information or have any
  23  * questions.
  24  */
  25 
  26 #if defined(__linux__) || defined(_ALLBSD_SOURCE)
  27 #include <stdio.h>
  28 #include <ctype.h>
  29 #endif
  30 #include <pwd.h>
  31 #include <locale.h>
  32 #ifndef ARCHPROPNAME
  33 #error "The macro ARCHPROPNAME has not been defined"
  34 #endif
  35 #include <sys/utsname.h>        /* For os_name and os_version */
  36 #include <langinfo.h>           /* For nl_langinfo */
  37 #include <stdlib.h>
  38 #include <string.h>
  39 #include <sys/types.h>
  40 #include <unistd.h>
  41 #include <sys/param.h>
  42 #include <time.h>
  43 #include <errno.h>
  44 
  45 #ifdef MACOSX
  46 #include "java_props_macosx.h"
  47 #endif
  48 
  49 #if defined(_ALLBSD_SOURCE)
  50 #if !defined(P_tmpdir)
  51 #include <paths.h>
  52 #define P_tmpdir _PATH_VARTMP
  53 #endif
  54 #endif
  55 
  56 #include "locale_str.h"
  57 #include "java_props.h"
  58 
  59 #if !defined(_ALLBSD_SOURCE)
  60 #ifdef __linux__
  61   #ifndef CODESET
  62   #define CODESET _NL_CTYPE_CODESET_NAME
  63   #endif
  64 #else
  65 #ifdef ALT_CODESET_KEY
  66 #define CODESET ALT_CODESET_KEY
  67 #endif
  68 #endif
  69 #endif /* !_ALLBSD_SOURCE */
  70 
  71 /* Take an array of string pairs (map of key->value) and a string (key).
  72  * Examine each pair in the map to see if the first string (key) matches the
  73  * string.  If so, store the second string of the pair (value) in the value and
  74  * return 1.  Otherwise do nothing and return 0.  The end of the map is
  75  * indicated by an empty string at the start of a pair (key of "").
  76  */
  77 static int
  78 mapLookup(char* map[], const char* key, char** value) {
  79     int i;
  80     for (i = 0; strcmp(map[i], ""); i += 2){
  81         if (!strcmp(key, map[i])){
  82             *value = map[i + 1];
  83             return 1;
  84         }
  85     }
  86     return 0;
  87 }
  88 
  89 #ifndef P_tmpdir
  90 #define P_tmpdir "/var/tmp"
  91 #endif
  92 
  93 static int ParseLocale(JNIEnv* env, int cat, char ** std_language, char ** std_script,
  94                        char ** std_country, char ** std_variant, char ** std_encoding) {
  95     char *temp = NULL;
  96     char *language = NULL, *country = NULL, *variant = NULL,
  97          *encoding = NULL;
  98     char *p, *encoding_variant, *old_temp, *old_ev;
  99     char *lc;
 100 
 101     /* Query the locale set for the category */
 102 
 103 #ifdef MACOSX
 104     lc = setupMacOSXLocale(cat); // malloc'd memory, need to free
 105 #else
 106     lc = setlocale(cat, NULL);
 107 #endif
 108 
 109 #ifndef __linux__
 110     if (lc == NULL) {
 111         return 0;
 112     }
 113 
 114     temp = malloc(strlen(lc) + 1);
 115     if (temp == NULL) {
 116 #ifdef MACOSX
 117         free(lc); // malloced memory
 118 #endif
 119         JNU_ThrowOutOfMemoryError(env, NULL);
 120         return 0;
 121     }
 122 
 123     if (cat == LC_CTYPE) {
 124         /*
 125          * Workaround for Solaris bug 4201684: Xlib doesn't like @euro
 126          * locales. Since we don't depend on the libc @euro behavior,
 127          * we just remove the qualifier.
 128          * On Linux, the bug doesn't occur; on the other hand, @euro
 129          * is needed there because it's a shortcut that also determines
 130          * the encoding - without it, we wouldn't get ISO-8859-15.
 131          * Therefore, this code section is Solaris-specific.
 132          */
 133         strcpy(temp, lc);
 134         p = strstr(temp, "@euro");
 135         if (p != NULL) {
 136             *p = '\0';
 137             setlocale(LC_ALL, temp);
 138         }
 139     }
 140 #else
 141     if (lc == NULL || !strcmp(lc, "C") || !strcmp(lc, "POSIX")) {
 142         lc = "en_US";
 143     }
 144 
 145     temp = malloc(strlen(lc) + 1);
 146     if (temp == NULL) {
 147         JNU_ThrowOutOfMemoryError(env, NULL);
 148         return 0;
 149     }
 150 
 151 #endif
 152 
 153     /*
 154      * locale string format in Solaris is
 155      * <language name>_<country name>.<encoding name>@<variant name>
 156      * <country name>, <encoding name>, and <variant name> are optional.
 157      */
 158 
 159     strcpy(temp, lc);
 160 #ifdef MACOSX
 161     free(lc); // malloced memory
 162 #endif
 163     /* Parse the language, country, encoding, and variant from the
 164      * locale.  Any of the elements may be missing, but they must occur
 165      * in the order language_country.encoding@variant, and must be
 166      * preceded by their delimiter (except for language).
 167      *
 168      * If the locale name (without .encoding@variant, if any) matches
 169      * any of the names in the locale_aliases list, map it to the
 170      * corresponding full locale name.  Most of the entries in the
 171      * locale_aliases list are locales that include a language name but
 172      * no country name, and this facility is used to map each language
 173      * to a default country if that's possible.  It's also used to map
 174      * the Solaris locale aliases to their proper Java locale IDs.
 175      */
 176 
 177     encoding_variant = malloc(strlen(temp)+1);
 178     if (encoding_variant == NULL) {
 179         free(temp);
 180         JNU_ThrowOutOfMemoryError(env, NULL);
 181         return 0;
 182     }
 183 
 184     if ((p = strchr(temp, '.')) != NULL) {
 185         strcpy(encoding_variant, p); /* Copy the leading '.' */
 186         *p = '\0';
 187     } else if ((p = strchr(temp, '@')) != NULL) {
 188         strcpy(encoding_variant, p); /* Copy the leading '@' */
 189         *p = '\0';
 190     } else {
 191         *encoding_variant = '\0';
 192     }
 193 
 194     if (mapLookup(locale_aliases, temp, &p)) {
 195         old_temp = temp;
 196         temp = realloc(temp, strlen(p)+1);
 197         if (temp == NULL) {
 198             free(old_temp);
 199             free(encoding_variant);
 200             JNU_ThrowOutOfMemoryError(env, NULL);
 201             return 0;
 202         }
 203         strcpy(temp, p);
 204         old_ev = encoding_variant;
 205         encoding_variant = realloc(encoding_variant, strlen(temp)+1);
 206         if (encoding_variant == NULL) {
 207             free(old_ev);
 208             free(temp);
 209             JNU_ThrowOutOfMemoryError(env, NULL);
 210             return 0;
 211         }
 212         // check the "encoding_variant" again, if any.
 213         if ((p = strchr(temp, '.')) != NULL) {
 214             strcpy(encoding_variant, p); /* Copy the leading '.' */
 215             *p = '\0';
 216         } else if ((p = strchr(temp, '@')) != NULL) {
 217             strcpy(encoding_variant, p); /* Copy the leading '@' */
 218             *p = '\0';
 219         }
 220     }
 221 
 222     language = temp;
 223     if ((country = strchr(temp, '_')) != NULL) {
 224         *country++ = '\0';
 225     }
 226 
 227     p = encoding_variant;
 228     if ((encoding = strchr(p, '.')) != NULL) {
 229         p[encoding++ - p] = '\0';
 230         p = encoding;
 231     }
 232     if ((variant = strchr(p, '@')) != NULL) {
 233         p[variant++ - p] = '\0';
 234     }
 235 
 236     /* Normalize the language name */
 237     if (std_language != NULL) {
 238         *std_language = "en";
 239         if (language != NULL && mapLookup(language_names, language, std_language) == 0) {
 240             *std_language = malloc(strlen(language)+1);
 241             strcpy(*std_language, language);
 242         }
 243     }
 244 
 245     /* Normalize the country name */
 246     if (std_country != NULL && country != NULL) {
 247         if (mapLookup(country_names, country, std_country) == 0) {
 248             *std_country = malloc(strlen(country)+1);
 249             strcpy(*std_country, country);
 250         }
 251     }
 252 
 253     /* Normalize the script and variant name.  Note that we only use
 254      * variants listed in the mapping array; others are ignored.
 255      */
 256     if (variant != NULL) {
 257         if (std_script != NULL) {
 258             mapLookup(script_names, variant, std_script);
 259         }
 260 
 261         if (std_variant != NULL) {
 262             mapLookup(variant_names, variant, std_variant);
 263         }
 264     }
 265 
 266     /* Normalize the encoding name.  Note that we IGNORE the string
 267      * 'encoding' extracted from the locale name above.  Instead, we use the
 268      * more reliable method of calling nl_langinfo(CODESET).  This function
 269      * returns an empty string if no encoding is set for the given locale
 270      * (e.g., the C or POSIX locales); we use the default ISO 8859-1
 271      * converter for such locales.
 272      */
 273     if (std_encoding != NULL) {
 274         /* OK, not so reliable - nl_langinfo() gives wrong answers on
 275          * Euro locales, in particular. */
 276         if (strcmp(p, "ISO8859-15") == 0)
 277             p = "ISO8859-15";
 278         else
 279             p = nl_langinfo(CODESET);
 280 
 281         /* Convert the bare "646" used on Solaris to a proper IANA name */
 282         if (strcmp(p, "646") == 0)
 283             p = "ISO646-US";
 284 
 285         /* return same result nl_langinfo would return for en_UK,
 286          * in order to use optimizations. */
 287         *std_encoding = (*p != '\0') ? p : "ISO8859-1";
 288 
 289 #ifdef __linux__
 290         /*
 291          * Remap the encoding string to a different value for japanese
 292          * locales on linux so that customized converters are used instead
 293          * of the default converter for "EUC-JP". The customized converters
 294          * omit support for the JIS0212 encoding which is not supported by
 295          * the variant of "EUC-JP" encoding used on linux
 296          */
 297         if (strcmp(p, "EUC-JP") == 0) {
 298             *std_encoding = "EUC-JP-LINUX";
 299         }
 300 #endif
 301 
 302 #ifdef _AIX
 303         if (strcmp(p, "big5") == 0) {
 304             /* On AIX Traditional Chinese Big5 codeset is mapped to IBM-950 */
 305             *std_encoding = "IBM-950";
 306         } else if (strcmp(p, "IBM-943") == 0) {
 307             /*
 308              * On AIX, IBM-943 is mapped to IBM-943C in which symbol 'yen' and
 309              * 'overline' are replaced with 'backslash' and 'tilde' from ASCII
 310              * making first 96 code points same as ASCII.
 311              */
 312             *std_encoding = "IBM-943C";
 313         }
 314 #endif
 315 
 316 #ifdef __solaris__
 317         if (strcmp(p,"eucJP") == 0) {
 318             /* For Solaris use customized vendor defined character
 319              * customized EUC-JP converter
 320              */
 321             *std_encoding = "eucJP-open";
 322         } else if (strcmp(p, "Big5") == 0 || strcmp(p, "BIG5") == 0) {
 323             /*
 324              * Remap the encoding string to Big5_Solaris which augments
 325              * the default converter for Solaris Big5 locales to include
 326              * seven additional ideographic characters beyond those included
 327              * in the Java "Big5" converter.
 328              */
 329             *std_encoding = "Big5_Solaris";
 330         } else if (strcmp(p, "Big5-HKSCS") == 0) {
 331             /*
 332              * Solaris uses HKSCS2001
 333              */
 334             *std_encoding = "Big5-HKSCS-2001";
 335         }
 336 #endif
 337 #ifdef MACOSX
 338         /*
 339          * For the case on MacOS X where encoding is set to US-ASCII, but we
 340          * don't have any encoding hints from LANG/LC_ALL/LC_CTYPE, use UTF-8
 341          * instead.
 342          *
 343          * The contents of ASCII files will still be read and displayed
 344          * correctly, but so will files containing UTF-8 characters beyond the
 345          * standard ASCII range.
 346          *
 347          * Specifically, this allows apps launched by double-clicking a .jar
 348          * file to correctly read UTF-8 files using the default encoding (see
 349          * 8011194).
 350          */
 351         const char* env_lang = getenv("LANG");
 352         const char* env_lc_all = getenv("LC_ALL");
 353         const char* env_lc_ctype = getenv("LC_CTYPE");
 354 
 355         if (strcmp(p,"US-ASCII") == 0 &&
 356             (env_lang == NULL || strlen(env_lang) == 0) &&
 357             (env_lc_all == NULL || strlen(env_lc_all) == 0) &&
 358             (env_lc_ctype == NULL || strlen(env_lc_ctype) == 0)) {
 359             *std_encoding = "UTF-8";
 360         }
 361 #endif
 362     }
 363 
 364     free(temp);
 365     free(encoding_variant);
 366 
 367     return 1;
 368 }
 369 
 370 /* This function gets called very early, before VM_CALLS are setup.
 371  * Do not use any of the VM_CALLS entries!!!
 372  */
 373 java_props_t *
 374 GetJavaProperties(JNIEnv *env)
 375 {
 376     static java_props_t sprops;
 377     char *v; /* tmp var */
 378 
 379     if (sprops.user_dir) {
 380         return &sprops;
 381     }
 382 
 383     /* tmp dir */
 384     sprops.tmp_dir = P_tmpdir;
 385 #ifdef MACOSX
 386     /* darwin has a per-user temp dir */
 387     static char tmp_path[PATH_MAX];
 388     int pathSize = confstr(_CS_DARWIN_USER_TEMP_DIR, tmp_path, PATH_MAX);
 389     if (pathSize > 0 && pathSize <= PATH_MAX) {
 390         sprops.tmp_dir = tmp_path;
 391     }
 392 #endif /* MACOSX */
 393 
 394     /* patches/service packs installed */
 395     sprops.patch_level = NULL;      // leave it undefined
 396 
 397 #ifdef SI_ISALIST
 398     /* supported instruction sets */
 399     {
 400         char list[258];
 401         sysinfo(SI_ISALIST, list, sizeof(list));
 402         sprops.cpu_isalist = strdup(list);
 403     }
 404 #else
 405     sprops.cpu_isalist = NULL;
 406 #endif
 407 
 408     /* endianness of platform */
 409     {
 410         unsigned int endianTest = 0xff000000;
 411         if (((char*)(&endianTest))[0] != 0)
 412             sprops.cpu_endian = "big";
 413         else
 414             sprops.cpu_endian = "little";
 415     }
 416 
 417     /* os properties */
 418     {
 419 #ifdef MACOSX
 420         setOSNameAndVersion(&sprops);
 421 #else
 422         struct utsname name;
 423         uname(&name);
 424         sprops.os_name = strdup(name.sysname);
 425 #ifdef _AIX
 426         {
 427             char *os_version = malloc(strlen(name.version) +
 428                                       strlen(name.release) + 2);
 429             if (os_version != NULL) {
 430                 strcpy(os_version, name.version);
 431                 strcat(os_version, ".");
 432                 strcat(os_version, name.release);
 433             }
 434             sprops.os_version = os_version;
 435         }
 436 #else
 437         sprops.os_version = strdup(name.release);
 438 #endif /* _AIX   */
 439 #endif /* MACOSX */
 440 
 441         sprops.os_arch = ARCHPROPNAME;
 442     }
 443 
 444     /* ABI property (optional) */
 445 #ifdef JDK_ARCH_ABI_PROP_NAME
 446     sprops.sun_arch_abi = JDK_ARCH_ABI_PROP_NAME;
 447 #endif
 448 
 449     /* Determine the language, country, variant, and encoding from the host,
 450      * and store these in the user.language, user.country, user.variant and
 451      * file.encoding system properties. */
 452     setlocale(LC_ALL, "");
 453     if (ParseLocale(env, LC_CTYPE,
 454                     &(sprops.format_language),
 455                     &(sprops.format_script),
 456                     &(sprops.format_country),
 457                     &(sprops.format_variant),
 458                     &(sprops.encoding))) {
 459         ParseLocale(env, LC_MESSAGES,
 460                     &(sprops.display_language),
 461                     &(sprops.display_script),
 462                     &(sprops.display_country),
 463                     &(sprops.display_variant),
 464                     NULL);
 465     } else {
 466         sprops.display_language = "en";
 467         sprops.encoding = "ISO8859-1";
 468     }
 469 
 470     /* ParseLocale failed with OOME */
 471     JNU_CHECK_EXCEPTION_RETURN(env, NULL);
 472 
 473 #ifdef MACOSX
 474     sprops.sun_jnu_encoding = "UTF-8";
 475 #else
 476     sprops.sun_jnu_encoding = sprops.encoding;
 477 #endif
 478 
 479 #ifdef _ALLBSD_SOURCE
 480 #if BYTE_ORDER == _LITTLE_ENDIAN
 481      sprops.unicode_encoding = "UnicodeLittle";
 482  #else
 483      sprops.unicode_encoding = "UnicodeBig";
 484  #endif
 485 #else /* !_ALLBSD_SOURCE */
 486 #ifdef __linux__
 487 #if __BYTE_ORDER == __LITTLE_ENDIAN
 488     sprops.unicode_encoding = "UnicodeLittle";
 489 #else
 490     sprops.unicode_encoding = "UnicodeBig";
 491 #endif
 492 #else
 493     sprops.unicode_encoding = "UnicodeBig";
 494 #endif
 495 #endif /* _ALLBSD_SOURCE */
 496 
 497     /* user properties */
 498     {
 499         struct passwd *pwent = getpwuid(getuid());
 500         sprops.user_name = pwent ? strdup(pwent->pw_name) : "?";
 501 #ifdef MACOSX
 502         setUserHome(&sprops);
 503 #else
 504         sprops.user_home = pwent ? strdup(pwent->pw_dir) : NULL;
 505 #endif
 506         if (sprops.user_home == NULL) {
 507             sprops.user_home = "?";
 508         }
 509     }
 510 
 511     /* User TIMEZONE
 512      * We defer setting up timezone until it's actually necessary.
 513      * Refer to TimeZone.getDefault(). The system property
 514      * is able to be set by the command line interface -Duser.timezone.
 515      */
 516     tzset();        /* for compatibility */
 517 
 518     /* Current directory */
 519     {
 520         char buf[MAXPATHLEN];
 521         errno = 0;
 522         if (getcwd(buf, sizeof(buf))  == NULL)
 523             JNU_ThrowByName(env, "java/lang/Error",
 524              "Properties init: Could not determine current working directory.");
 525         else
 526             sprops.user_dir = strdup(buf);
 527     }
 528 
 529     sprops.file_separator = "/";
 530     sprops.path_separator = ":";
 531     sprops.line_separator = "\n";
 532 
 533 #ifdef MACOSX
 534     setProxyProperties(&sprops);
 535 #endif
 536 
 537     return &sprops;
 538 }
 539 
 540 jstring
 541 GetStringPlatform(JNIEnv *env, nchar* cstr)
 542 {
 543     return JNU_NewStringPlatform(env, cstr);
 544 }