gettext-tools/src/write-po.c

/* GNU gettext - internationalization aids
   Copyright (C) 1995-1998, 2000-2006 Free Software Foundation, Inc.

   This file was written by Peter Miller <millerp@canb.auug.org.au>

   This program is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 2, or (at your option)
   any later version.

   This program is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with this program; if not, write to the Free Software Foundation,
   Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.  */
*946379e7Schristos
*946379e7Schristos#ifdef HAVE_CONFIG_H
*946379e7Schristos# include <config.h>
*946379e7Schristos#endif
*946379e7Schristos#include <alloca.h>
*946379e7Schristos
*946379e7Schristos/* Specification.  */
*946379e7Schristos#include "write-po.h"
*946379e7Schristos
*946379e7Schristos#include <errno.h>
*946379e7Schristos#include <limits.h>
*946379e7Schristos#include <stdio.h>
*946379e7Schristos#include <stdlib.h>
*946379e7Schristos#include <string.h>
*946379e7Schristos
*946379e7Schristos#if HAVE_ICONV
*946379e7Schristos# include <iconv.h>
*946379e7Schristos#endif
*946379e7Schristos
*946379e7Schristos#include "c-ctype.h"
*946379e7Schristos#include "po-charset.h"
*946379e7Schristos#include "linebreak.h"
*946379e7Schristos#include "msgl-ascii.h"
*946379e7Schristos#include "write-properties.h"
*946379e7Schristos#include "write-stringtable.h"
*946379e7Schristos#include "xalloc.h"
*946379e7Schristos#include "xallocsa.h"
*946379e7Schristos#include "c-strstr.h"
*946379e7Schristos#include "xvasprintf.h"
*946379e7Schristos#include "po-xerror.h"
*946379e7Schristos#include "gettext.h"
*946379e7Schristos
*946379e7Schristos/* Our regular abbreviation.  */
*946379e7Schristos#define _(str) gettext (str)
*946379e7Schristos
*946379e7Schristos#if HAVE_DECL_PUTC_UNLOCKED
*946379e7Schristos# undef putc
*946379e7Schristos# define putc putc_unlocked
*946379e7Schristos#endif
*946379e7Schristos
*946379e7Schristos
/* =================== Putting together a #, flags line. =================== */
*946379e7Schristos
*946379e7Schristos
*946379e7Schristos/* Convert IS_FORMAT in the context of programming language LANG to a flag
*946379e7Schristos   string for use in #, flags.  */
*946379e7Schristos
*946379e7Schristosconst char *
*946379e7Schristosmake_format_description_string (enum is_format is_format, const char *lang,
*946379e7Schristos				bool debug)
*946379e7Schristos{
*946379e7Schristos  static char result[100];
*946379e7Schristos
*946379e7Schristos  switch (is_format)
*946379e7Schristos    {
*946379e7Schristos    case possible:
*946379e7Schristos      if (debug)
*946379e7Schristos	{
*946379e7Schristos	  sprintf (result, " possible-%s-format", lang);
*946379e7Schristos	  break;
*946379e7Schristos	}
*946379e7Schristos      /* FALLTHROUGH */
*946379e7Schristos    case yes_according_to_context:
*946379e7Schristos    case yes:
*946379e7Schristos      sprintf (result, " %s-format", lang);
*946379e7Schristos      break;
*946379e7Schristos    case no:
*946379e7Schristos      sprintf (result, " no-%s-format", lang);
*946379e7Schristos      break;
*946379e7Schristos    default:
*946379e7Schristos      /* The others have already been filtered out by significant_format_p.  */
*946379e7Schristos      abort ();
*946379e7Schristos    }
*946379e7Schristos
*946379e7Schristos  return result;
*946379e7Schristos}
*946379e7Schristos
*946379e7Schristos
*946379e7Schristos/* Return true if IS_FORMAT is worth mentioning in a #, flags list.  */
*946379e7Schristos
*946379e7Schristosbool
*946379e7Schristossignificant_format_p (enum is_format is_format)
*946379e7Schristos{
*946379e7Schristos  return is_format != undecided && is_format != impossible;
*946379e7Schristos}
*946379e7Schristos
*946379e7Schristos
*946379e7Schristos/* Return true if one of IS_FORMAT is worth mentioning in a #, flags list.  */
*946379e7Schristos
*946379e7Schristosstatic bool
*946379e7Schristoshas_significant_format_p (const enum is_format is_format[NFORMATS])
*946379e7Schristos{
*946379e7Schristos  size_t i;
*946379e7Schristos
*946379e7Schristos  for (i = 0; i < NFORMATS; i++)
*946379e7Schristos    if (significant_format_p (is_format[i]))
*946379e7Schristos      return true;
*946379e7Schristos  return false;
*946379e7Schristos}
*946379e7Schristos
*946379e7Schristos
*946379e7Schristos/* Convert a wrapping flag DO_WRAP to a string for use in #, flags.  */
*946379e7Schristos
*946379e7Schristosstatic const char *
*946379e7Schristosmake_c_width_description_string (enum is_wrap do_wrap)
*946379e7Schristos{
*946379e7Schristos  const char *result = NULL;
*946379e7Schristos
*946379e7Schristos  switch (do_wrap)
*946379e7Schristos    {
*946379e7Schristos    case yes:
*946379e7Schristos      result = " wrap";
*946379e7Schristos      break;
*946379e7Schristos    case no:
*946379e7Schristos      result = " no-wrap";
*946379e7Schristos      break;
*946379e7Schristos    default:
*946379e7Schristos      abort ();
*946379e7Schristos    }
*946379e7Schristos
*946379e7Schristos  return result;
*946379e7Schristos}
*946379e7Schristos
*946379e7Schristos
/* ================ Output parts of a message, as comments. ================ */
*946379e7Schristos
*946379e7Schristos
*946379e7Schristos/* Output mp->comment as a set of comment lines.  */
*946379e7Schristos
*946379e7Schristosvoid
*946379e7Schristosmessage_print_comment (const message_ty *mp, FILE *fp)
*946379e7Schristos{
*946379e7Schristos  if (mp->comment != NULL)
*946379e7Schristos    {
*946379e7Schristos      size_t j;
*946379e7Schristos
*946379e7Schristos      for (j = 0; j < mp->comment->nitems; ++j)
*946379e7Schristos	{
*946379e7Schristos	  const char *s = mp->comment->item[j];
*946379e7Schristos	  do
*946379e7Schristos	    {
*946379e7Schristos	      const char *e;
*946379e7Schristos	      putc ('#', fp);
*946379e7Schristos	      if (*s != '\0' && *s != ' ')
*946379e7Schristos		putc (' ', fp);
*946379e7Schristos	      e = strchr (s, '\n');
*946379e7Schristos	      if (e == NULL)
*946379e7Schristos		{
*946379e7Schristos		  fputs (s, fp);
*946379e7Schristos		  s = NULL;
*946379e7Schristos		}
*946379e7Schristos	      else
*946379e7Schristos		{
*946379e7Schristos		  fwrite (s, 1, e - s, fp);
*946379e7Schristos		  s = e + 1;
*946379e7Schristos		}
*946379e7Schristos	      putc ('\n', fp);
*946379e7Schristos	    }
*946379e7Schristos	  while (s != NULL);
*946379e7Schristos	}
*946379e7Schristos    }
*946379e7Schristos}
*946379e7Schristos
*946379e7Schristos
*946379e7Schristos/* Output mp->comment_dot as a set of comment lines.  */
*946379e7Schristos
*946379e7Schristosvoid
*946379e7Schristosmessage_print_comment_dot (const message_ty *mp, FILE *fp)
*946379e7Schristos{
*946379e7Schristos  if (mp->comment_dot != NULL)
*946379e7Schristos    {
*946379e7Schristos      size_t j;
*946379e7Schristos
*946379e7Schristos      for (j = 0; j < mp->comment_dot->nitems; ++j)
*946379e7Schristos	{
*946379e7Schristos	  const char *s = mp->comment_dot->item[j];
*946379e7Schristos	  putc ('#', fp);
*946379e7Schristos	  putc ('.', fp);
*946379e7Schristos	  if (*s != '\0' && *s != ' ')
*946379e7Schristos	    putc (' ', fp);
*946379e7Schristos	  fputs (s, fp);
*946379e7Schristos	  putc ('\n', fp);
*946379e7Schristos	}
*946379e7Schristos    }
*946379e7Schristos}
*946379e7Schristos
*946379e7Schristos
*946379e7Schristos/* Output mp->filepos as a set of comment lines.  */
*946379e7Schristos
*946379e7Schristosvoid
*946379e7Schristosmessage_print_comment_filepos (const message_ty *mp, FILE *fp,
*946379e7Schristos			       bool uniforum, size_t page_width)
*946379e7Schristos{
*946379e7Schristos  if (mp->filepos_count != 0)
*946379e7Schristos    {
*946379e7Schristos      if (uniforum)
*946379e7Schristos	{
*946379e7Schristos	  size_t j;
*946379e7Schristos
*946379e7Schristos	  for (j = 0; j < mp->filepos_count; ++j)
*946379e7Schristos	    {
*946379e7Schristos	      lex_pos_ty *pp = &mp->filepos[j];
*946379e7Schristos	      char *cp = pp->file_name;
*946379e7Schristos	      while (cp[0] == '.' && cp[1] == '/')
*946379e7Schristos		cp += 2;
*946379e7Schristos	      /* There are two Sun formats to choose from: SunOS and
*946379e7Schristos		 Solaris.  Use the Solaris form here.  */
*946379e7Schristos	      fprintf (fp, "# File: %s, line: %ld\n",
*946379e7Schristos		       cp, (long) pp->line_number);
*946379e7Schristos	    }
*946379e7Schristos	}
*946379e7Schristos      else
*946379e7Schristos	{
*946379e7Schristos	  size_t column;
*946379e7Schristos	  size_t j;
*946379e7Schristos
*946379e7Schristos	  fputs ("#:", fp);
*946379e7Schristos	  column = 2;
*946379e7Schristos	  for (j = 0; j < mp->filepos_count; ++j)
*946379e7Schristos	    {
*946379e7Schristos	      lex_pos_ty *pp;
*946379e7Schristos	      char buffer[21];
*946379e7Schristos	      char *cp;
*946379e7Schristos	      size_t len;
*946379e7Schristos
*946379e7Schristos	      pp = &mp->filepos[j];
*946379e7Schristos	      cp = pp->file_name;
*946379e7Schristos	      while (cp[0] == '.' && cp[1] == '/')
*946379e7Schristos		cp += 2;
*946379e7Schristos	      /* Some xgettext input formats, like RST, lack line numbers.  */
*946379e7Schristos	      if (pp->line_number == (size_t)(-1))
*946379e7Schristos		buffer[0] = '\0';
*946379e7Schristos	      else
*946379e7Schristos		sprintf (buffer, ":%ld", (long) pp->line_number);
*946379e7Schristos	      len = strlen (cp) + strlen (buffer) + 1;
*946379e7Schristos	      if (column > 2 && column + len >= page_width)
*946379e7Schristos		{
*946379e7Schristos		  fputs ("\n#:", fp);
*946379e7Schristos		  column = 2;
*946379e7Schristos		}
*946379e7Schristos	      fprintf (fp, " %s%s", cp, buffer);
*946379e7Schristos	      column += len;
*946379e7Schristos	    }
*946379e7Schristos	  putc ('\n', fp);
*946379e7Schristos	}
*946379e7Schristos    }
*946379e7Schristos}
*946379e7Schristos
*946379e7Schristos
*946379e7Schristos/* Output mp->is_fuzzy, mp->is_format, mp->do_wrap as a comment line.  */
*946379e7Schristos
*946379e7Schristosvoid
*946379e7Schristosmessage_print_comment_flags (const message_ty *mp, FILE *fp, bool debug)
*946379e7Schristos{
*946379e7Schristos  if ((mp->is_fuzzy && mp->msgstr[0] != '\0')
*946379e7Schristos      || has_significant_format_p (mp->is_format)
*946379e7Schristos      || mp->do_wrap == no)
*946379e7Schristos    {
*946379e7Schristos      bool first_flag = true;
*946379e7Schristos      size_t i;
*946379e7Schristos
*946379e7Schristos      putc ('#', fp);
*946379e7Schristos      putc (',', fp);
*946379e7Schristos
*946379e7Schristos      /* We don't print the fuzzy flag if the msgstr is empty.  This
*946379e7Schristos	 might be introduced by the user but we want to normalize the
*946379e7Schristos	 output.  */
*946379e7Schristos      if (mp->is_fuzzy && mp->msgstr[0] != '\0')
*946379e7Schristos	{
*946379e7Schristos	  fputs (" fuzzy", fp);
*946379e7Schristos	  first_flag = false;
*946379e7Schristos	}
*946379e7Schristos
*946379e7Schristos      for (i = 0; i < NFORMATS; i++)
*946379e7Schristos	if (significant_format_p (mp->is_format[i]))
*946379e7Schristos	  {
*946379e7Schristos	    if (!first_flag)
*946379e7Schristos	      putc (',', fp);
*946379e7Schristos
*946379e7Schristos	    fputs (make_format_description_string (mp->is_format[i],
*946379e7Schristos						   format_language[i], debug),
*946379e7Schristos		   fp);
*946379e7Schristos	    first_flag = false;
*946379e7Schristos	  }
*946379e7Schristos
*946379e7Schristos      if (mp->do_wrap == no)
*946379e7Schristos	{
*946379e7Schristos	  if (!first_flag)
*946379e7Schristos	    putc (',', fp);
*946379e7Schristos
*946379e7Schristos	  fputs (make_c_width_description_string (mp->do_wrap), fp);
*946379e7Schristos	  first_flag = false;
*946379e7Schristos	}
*946379e7Schristos
*946379e7Schristos      putc ('\n', fp);
*946379e7Schristos    }
*946379e7Schristos}
*946379e7Schristos
*946379e7Schristos
/* ========= Some parameters for use by 'msgdomain_list_print_po'. ========= */
*946379e7Schristos
*946379e7Schristos
/* This variable controls the extent to which the page width applies.
   True means it applies to message strings and file reference lines.
   False means it applies to file reference lines only.  */
static bool wrap_strings = true;

/* Stop applying the page width to message strings.  There is no way to
   turn it back on through this interface.  */
void
message_page_width_ignore (void)
{
  wrap_strings = false;
}
*946379e7Schristos
*946379e7Schristos
/* These three variables control the output style of the message_print
   function.  Interface functions for them are to be used.  */
static bool indent = false;
static bool uniforum = false;
static bool escape = false;

/* Select the indented output style.  */
void
message_print_style_indent (void)
{
  indent = true;
}

/* Select the Uniforum output style.  */
void
message_print_style_uniforum (void)
{
  uniforum = true;
}

/* Turn octal escaping of non-printable characters on (FLAG true) or
   off (FLAG false).  */
void
message_print_style_escape (bool flag)
{
  escape = flag;
}
*946379e7Schristos
*946379e7Schristos
/* =============== msgdomain_list_print_po() and subroutines. =============== */
*946379e7Schristos
*946379e7Schristos
/* Byte-wise copy of N bytes from SRC to DST, laid out so that the common
   cases N == 0 and N == 1 never enter the copy loop.  */
static inline void
memcpy_small (void *dst, const void *src, size_t n)
{
  char *out = (char *) dst;
  const char *in = (const char *) src;
  size_t k;

  if (n == 0)
    return;

  out[0] = in[0];
  for (k = 1; k < n; k++)
    out[k] = in[k];
}
*946379e7Schristos
*946379e7Schristos
*946379e7Schristosstatic void
*946379e7Schristoswrap (const message_ty *mp, FILE *fp, const char *line_prefix, int extra_indent,
*946379e7Schristos      const char *name, const char *value,
*946379e7Schristos      enum is_wrap do_wrap, size_t page_width,
*946379e7Schristos      const char *charset)
*946379e7Schristos{
*946379e7Schristos  const char *canon_charset;
*946379e7Schristos  const char *s;
*946379e7Schristos  bool first_line;
*946379e7Schristos#if HAVE_ICONV
*946379e7Schristos  const char *envval;
*946379e7Schristos  iconv_t conv;
*946379e7Schristos#endif
*946379e7Schristos  bool weird_cjk;
*946379e7Schristos
*946379e7Schristos  canon_charset = po_charset_canonicalize (charset);
*946379e7Schristos
*946379e7Schristos#if HAVE_ICONV
*946379e7Schristos  /* The old Solaris/openwin msgfmt and GNU msgfmt <= 0.10.35 don't know
*946379e7Schristos     about multibyte encodings, and require a spurious backslash after
*946379e7Schristos     every multibyte character whose last byte is 0x5C.  Some programs,
*946379e7Schristos     like vim, distribute PO files in this broken format.  It is important
*946379e7Schristos     for such programs that GNU msgmerge continues to support this old
*946379e7Schristos     PO file format when the Makefile requests it.  */
*946379e7Schristos  envval = getenv ("OLD_PO_FILE_OUTPUT");
*946379e7Schristos  if (envval != NULL && *envval != '\0')
*946379e7Schristos    /* Write a PO file in old format, with extraneous backslashes.  */
*946379e7Schristos    conv = (iconv_t)(-1);
*946379e7Schristos  else
*946379e7Schristos    if (canon_charset == NULL)
*946379e7Schristos      /* Invalid PO file encoding.  */
*946379e7Schristos      conv = (iconv_t)(-1);
*946379e7Schristos    else
*946379e7Schristos      /* Avoid glibc-2.1 bug with EUC-KR.  */
*946379e7Schristos# if (__GLIBC__ - 0 == 2 && __GLIBC_MINOR__ - 0 <= 1) && !defined _LIBICONV_VERSION
*946379e7Schristos      if (strcmp (canon_charset, "EUC-KR") == 0)
*946379e7Schristos	conv = (iconv_t)(-1);
*946379e7Schristos      else
*946379e7Schristos# endif
*946379e7Schristos      /* Avoid Solaris 2.9 bug with GB2312, EUC-TW, BIG5, BIG5-HKSCS, GBK,
*946379e7Schristos	 GB18030.  */
*946379e7Schristos# if defined __sun && !defined _LIBICONV_VERSION
*946379e7Schristos      if (   strcmp (canon_charset, "GB2312") == 0
*946379e7Schristos	  || strcmp (canon_charset, "EUC-TW") == 0
*946379e7Schristos	  || strcmp (canon_charset, "BIG5") == 0
*946379e7Schristos	  || strcmp (canon_charset, "BIG5-HKSCS") == 0
*946379e7Schristos	  || strcmp (canon_charset, "GBK") == 0
*946379e7Schristos	  || strcmp (canon_charset, "GB18030") == 0)
*946379e7Schristos	conv = (iconv_t)(-1);
*946379e7Schristos      else
*946379e7Schristos# endif
*946379e7Schristos      /* Use iconv() to parse multibyte characters.  */
*946379e7Schristos      conv = iconv_open ("UTF-8", canon_charset);
*946379e7Schristos
*946379e7Schristos  if (conv != (iconv_t)(-1))
*946379e7Schristos    weird_cjk = false;
*946379e7Schristos  else
*946379e7Schristos#endif
*946379e7Schristos    if (canon_charset == NULL)
*946379e7Schristos      weird_cjk = false;
*946379e7Schristos    else
*946379e7Schristos      weird_cjk = po_is_charset_weird_cjk (canon_charset);
*946379e7Schristos
*946379e7Schristos  if (canon_charset == NULL)
*946379e7Schristos    canon_charset = po_charset_ascii;
*946379e7Schristos
*946379e7Schristos  /* Loop over the '\n' delimited portions of value.  */
*946379e7Schristos  s = value;
*946379e7Schristos  first_line = true;
*946379e7Schristos  do
*946379e7Schristos    {
*946379e7Schristos      /* The usual escapes, as defined by the ANSI C Standard.  */
*946379e7Schristos#     define is_escape(c) \
*946379e7Schristos        ((c) == '\a' || (c) == '\b' || (c) == '\f' || (c) == '\n' \
*946379e7Schristos         || (c) == '\r' || (c) == '\t' || (c) == '\v')
*946379e7Schristos
*946379e7Schristos      const char *es;
*946379e7Schristos      const char *ep;
*946379e7Schristos      size_t portion_len;
*946379e7Schristos      char *portion;
*946379e7Schristos      char *overrides;
*946379e7Schristos      char *linebreaks;
*946379e7Schristos      char *pp;
*946379e7Schristos      char *op;
*946379e7Schristos      int startcol, startcol_after_break, width;
*946379e7Schristos      size_t i;
*946379e7Schristos
*946379e7Schristos      for (es = s; *es != '\0'; )
*946379e7Schristos	if (*es++ == '\n')
*946379e7Schristos	  break;
*946379e7Schristos
*946379e7Schristos      /* Expand escape sequences in each portion.  */
*946379e7Schristos      for (ep = s, portion_len = 0; ep < es; ep++)
*946379e7Schristos	{
*946379e7Schristos	  char c = *ep;
*946379e7Schristos	  if (is_escape (c))
*946379e7Schristos	    portion_len += 2;
*946379e7Schristos	  else if (escape && !c_isprint ((unsigned char) c))
*946379e7Schristos	    portion_len += 4;
*946379e7Schristos	  else if (c == '\\' || c == '"')
*946379e7Schristos	    portion_len += 2;
*946379e7Schristos	  else
*946379e7Schristos	    {
*946379e7Schristos#if HAVE_ICONV
*946379e7Schristos	      if (conv != (iconv_t)(-1))
*946379e7Schristos		{
*946379e7Schristos		  /* Skip over a complete multi-byte character.  Don't
*946379e7Schristos		     interpret the second byte of a multi-byte character as
*946379e7Schristos		     ASCII.  This is needed for the BIG5, BIG5-HKSCS, GBK,
*946379e7Schristos		     GB18030, SHIFT_JIS, JOHAB encodings.  */
*946379e7Schristos		  char scratchbuf[64];
*946379e7Schristos		  const char *inptr = ep;
*946379e7Schristos		  size_t insize;
*946379e7Schristos		  char *outptr = &scratchbuf[0];
*946379e7Schristos		  size_t outsize = sizeof (scratchbuf);
*946379e7Schristos		  size_t res;
*946379e7Schristos
*946379e7Schristos		  res = (size_t)(-1);
*946379e7Schristos		  for (insize = 1; inptr + insize <= es; insize++)
*946379e7Schristos		    {
*946379e7Schristos		      res = iconv (conv,
*946379e7Schristos				   (ICONV_CONST char **) &inptr, &insize,
*946379e7Schristos				   &outptr, &outsize);
*946379e7Schristos		      if (!(res == (size_t)(-1) && errno == EINVAL))
*946379e7Schristos			break;
*946379e7Schristos		      /* We expect that no input bytes have been consumed
*946379e7Schristos			 so far.  */
*946379e7Schristos		      if (inptr != ep)
*946379e7Schristos			abort ();
*946379e7Schristos		    }
*946379e7Schristos		  if (res == (size_t)(-1))
*946379e7Schristos		    {
*946379e7Schristos		      if (errno == EILSEQ)
*946379e7Schristos			{
*946379e7Schristos			  po_xerror (PO_SEVERITY_ERROR, mp, NULL, 0, 0, false,
*946379e7Schristos				     _("invalid multibyte sequence"));
*946379e7Schristos			  continue;
*946379e7Schristos			}
*946379e7Schristos		      else
*946379e7Schristos			abort ();
*946379e7Schristos		    }
*946379e7Schristos		  insize = inptr - ep;
*946379e7Schristos		  portion_len += insize;
*946379e7Schristos		  ep += insize - 1;
*946379e7Schristos		}
*946379e7Schristos	      else
*946379e7Schristos#endif
*946379e7Schristos		{
*946379e7Schristos		  if (weird_cjk
*946379e7Schristos		      /* Special handling of encodings with CJK structure.  */
*946379e7Schristos		      && ep + 2 <= es
*946379e7Schristos		      && (unsigned char) ep[0] >= 0x80
*946379e7Schristos		      && (unsigned char) ep[1] >= 0x30)
*946379e7Schristos		    {
*946379e7Schristos		      portion_len += 2;
*946379e7Schristos		      ep += 1;
*946379e7Schristos		    }
*946379e7Schristos		  else
*946379e7Schristos		    portion_len += 1;
*946379e7Schristos		}
*946379e7Schristos	    }
*946379e7Schristos	}
*946379e7Schristos      portion = (char *) xmalloc (portion_len);
*946379e7Schristos      overrides = (char *) xmalloc (portion_len);
*946379e7Schristos      memset (overrides, UC_BREAK_UNDEFINED, portion_len);
*946379e7Schristos      for (ep = s, pp = portion, op = overrides; ep < es; ep++)
*946379e7Schristos	{
*946379e7Schristos	  char c = *ep;
*946379e7Schristos	  if (is_escape (c))
*946379e7Schristos	    {
*946379e7Schristos	      switch (c)
*946379e7Schristos		{
*946379e7Schristos		case '\a': c = 'a'; break;
*946379e7Schristos		case '\b': c = 'b'; break;
*946379e7Schristos		case '\f': c = 'f'; break;
*946379e7Schristos		case '\n': c = 'n'; break;
*946379e7Schristos		case '\r': c = 'r'; break;
*946379e7Schristos		case '\t': c = 't'; break;
*946379e7Schristos		case '\v': c = 'v'; break;
*946379e7Schristos		default: abort ();
*946379e7Schristos		}
*946379e7Schristos	      *pp++ = '\\';
*946379e7Schristos	      *pp++ = c;
*946379e7Schristos	      op++;
*946379e7Schristos	      *op++ = UC_BREAK_PROHIBITED;
*946379e7Schristos	      /* We warn about any use of escape sequences beside
*946379e7Schristos		 '\n' and '\t'.  */
*946379e7Schristos	      if (c != 'n' && c != 't')
*946379e7Schristos		{
*946379e7Schristos		  char *error_message =
*946379e7Schristos		    xasprintf (_("\
*946379e7Schristosinternationalized messages should not contain the `\\%c' escape sequence"),
*946379e7Schristos			       c);
*946379e7Schristos		  po_xerror (PO_SEVERITY_ERROR, mp, NULL, 0, 0, false,
*946379e7Schristos			     error_message);
*946379e7Schristos		  free (error_message);
*946379e7Schristos		}
*946379e7Schristos	    }
*946379e7Schristos	  else if (escape && !c_isprint ((unsigned char) c))
*946379e7Schristos	    {
*946379e7Schristos	      *pp++ = '\\';
*946379e7Schristos	      *pp++ = '0' + (((unsigned char) c >> 6) & 7);
*946379e7Schristos	      *pp++ = '0' + (((unsigned char) c >> 3) & 7);
*946379e7Schristos	      *pp++ = '0' + ((unsigned char) c & 7);
*946379e7Schristos	      op++;
*946379e7Schristos	      *op++ = UC_BREAK_PROHIBITED;
*946379e7Schristos	      *op++ = UC_BREAK_PROHIBITED;
*946379e7Schristos	      *op++ = UC_BREAK_PROHIBITED;
*946379e7Schristos	    }
*946379e7Schristos	  else if (c == '\\' || c == '"')
*946379e7Schristos	    {
*946379e7Schristos	      *pp++ = '\\';
*946379e7Schristos	      *pp++ = c;
*946379e7Schristos	      op++;
*946379e7Schristos	      *op++ = UC_BREAK_PROHIBITED;
*946379e7Schristos	    }
*946379e7Schristos	  else
*946379e7Schristos	    {
*946379e7Schristos#if HAVE_ICONV
*946379e7Schristos	      if (conv != (iconv_t)(-1))
*946379e7Schristos		{
*946379e7Schristos		  /* Copy a complete multi-byte character.  Don't
*946379e7Schristos		     interpret the second byte of a multi-byte character as
*946379e7Schristos		     ASCII.  This is needed for the BIG5, BIG5-HKSCS, GBK,
*946379e7Schristos		     GB18030, SHIFT_JIS, JOHAB encodings.  */
*946379e7Schristos		  char scratchbuf[64];
*946379e7Schristos		  const char *inptr = ep;
*946379e7Schristos		  size_t insize;
*946379e7Schristos		  char *outptr = &scratchbuf[0];
*946379e7Schristos		  size_t outsize = sizeof (scratchbuf);
*946379e7Schristos		  size_t res;
*946379e7Schristos
*946379e7Schristos		  res = (size_t)(-1);
*946379e7Schristos		  for (insize = 1; inptr + insize <= es; insize++)
*946379e7Schristos		    {
*946379e7Schristos		      res = iconv (conv,
*946379e7Schristos				   (ICONV_CONST char **) &inptr, &insize,
*946379e7Schristos				   &outptr, &outsize);
*946379e7Schristos		      if (!(res == (size_t)(-1) && errno == EINVAL))
*946379e7Schristos			break;
*946379e7Schristos		      /* We expect that no input bytes have been consumed
*946379e7Schristos			 so far.  */
*946379e7Schristos		      if (inptr != ep)
*946379e7Schristos			abort ();
*946379e7Schristos		    }
*946379e7Schristos		  if (res == (size_t)(-1))
*946379e7Schristos		    {
*946379e7Schristos		      if (errno == EILSEQ)
*946379e7Schristos			{
*946379e7Schristos			  po_xerror (PO_SEVERITY_ERROR, mp, NULL, 0, 0,
*946379e7Schristos				     false, _("invalid multibyte sequence"));
*946379e7Schristos			  continue;
*946379e7Schristos			}
*946379e7Schristos		      else
*946379e7Schristos			abort ();
*946379e7Schristos		    }
*946379e7Schristos		  insize = inptr - ep;
*946379e7Schristos		  memcpy_small (pp, ep, insize);
*946379e7Schristos		  pp += insize;
*946379e7Schristos		  op += insize;
*946379e7Schristos		  ep += insize - 1;
*946379e7Schristos		}
*946379e7Schristos	      else
*946379e7Schristos#endif
*946379e7Schristos		{
*946379e7Schristos		  if (weird_cjk
*946379e7Schristos		      /* Special handling of encodings with CJK structure.  */
*946379e7Schristos		      && ep + 2 <= es
*946379e7Schristos		      && (unsigned char) c >= 0x80
*946379e7Schristos		      && (unsigned char) ep[1] >= 0x30)
*946379e7Schristos		    {
*946379e7Schristos		      *pp++ = c;
*946379e7Schristos		      ep += 1;
*946379e7Schristos		      *pp++ = *ep;
*946379e7Schristos		      op += 2;
*946379e7Schristos		    }
*946379e7Schristos		  else
*946379e7Schristos		    {
*946379e7Schristos		      *pp++ = c;
*946379e7Schristos		      op++;
*946379e7Schristos		    }
*946379e7Schristos		}
*946379e7Schristos	    }
*946379e7Schristos	}
*946379e7Schristos
*946379e7Schristos      /* Don't break immediately before the "\n" at the end.  */
*946379e7Schristos      if (es > s && es[-1] == '\n')
*946379e7Schristos	overrides[portion_len - 2] = UC_BREAK_PROHIBITED;
*946379e7Schristos
*946379e7Schristos      linebreaks = (char *) xmalloc (portion_len);
*946379e7Schristos
*946379e7Schristos      /* Subsequent lines after a break are all indented.
*946379e7Schristos	 See INDENT-S.  */
*946379e7Schristos      startcol_after_break = (line_prefix ? strlen (line_prefix) : 0);
*946379e7Schristos      if (indent)
*946379e7Schristos	startcol_after_break = (startcol_after_break + extra_indent + 8) & ~7;
*946379e7Schristos      startcol_after_break++;
*946379e7Schristos
*946379e7Schristos      /* The line width.  Allow room for the closing quote character.  */
*946379e7Schristos      width = (wrap_strings && do_wrap != no ? page_width : INT_MAX) - 1;
*946379e7Schristos      /* Adjust for indentation of subsequent lines.  */
*946379e7Schristos      width -= startcol_after_break;
*946379e7Schristos
*946379e7Schristos    recompute:
*946379e7Schristos      /* The line starts with different things depending on whether it
*946379e7Schristos	 is the first line, and if we are using the indented style.
*946379e7Schristos	 See INDENT-F.  */
*946379e7Schristos      startcol = (line_prefix ? strlen (line_prefix) : 0);
*946379e7Schristos      if (first_line)
*946379e7Schristos	{
*946379e7Schristos	  startcol += strlen (name);
*946379e7Schristos	  if (indent)
*946379e7Schristos	    startcol = (startcol + extra_indent + 8) & ~7;
*946379e7Schristos	  else
*946379e7Schristos	    startcol++;
*946379e7Schristos	}
*946379e7Schristos      else
*946379e7Schristos	{
*946379e7Schristos	  if (indent)
*946379e7Schristos	    startcol = (startcol + extra_indent + 8) & ~7;
*946379e7Schristos	}
*946379e7Schristos      /* Allow room for the opening quote character.  */
*946379e7Schristos      startcol++;
*946379e7Schristos      /* Adjust for indentation of subsequent lines.  */
*946379e7Schristos      startcol -= startcol_after_break;
*946379e7Schristos
*946379e7Schristos      /* Do line breaking on the portion.  */
*946379e7Schristos      mbs_width_linebreaks (portion, portion_len, width, startcol, 0,
*946379e7Schristos			    overrides, canon_charset, linebreaks);
*946379e7Schristos
*946379e7Schristos      /* If this is the first line, and we are not using the indented
*946379e7Schristos	 style, and the line would wrap, then use an empty first line
*946379e7Schristos	 and restart.  */
*946379e7Schristos      if (first_line && !indent
*946379e7Schristos	  && portion_len > 0
*946379e7Schristos	  && (*es != '\0'
*946379e7Schristos	      || startcol > width
*946379e7Schristos	      || memchr (linebreaks, UC_BREAK_POSSIBLE, portion_len) != NULL))
*946379e7Schristos	{
*946379e7Schristos	  if (line_prefix != NULL)
*946379e7Schristos	    fputs (line_prefix, fp);
*946379e7Schristos	  fputs (name, fp);
*946379e7Schristos	  fputs (" \"\"\n", fp);
*946379e7Schristos	  first_line = false;
*946379e7Schristos	  /* Recompute startcol and linebreaks.  */
*946379e7Schristos	  goto recompute;
*946379e7Schristos	}
*946379e7Schristos
*946379e7Schristos      /* Print the beginning of the line.  This will depend on whether
*946379e7Schristos	 this is the first line, and if the indented style is being
*946379e7Schristos	 used.  INDENT-F.  */
*946379e7Schristos      if (line_prefix != NULL)
*946379e7Schristos	fputs (line_prefix, fp);
*946379e7Schristos      if (first_line)
*946379e7Schristos	{
*946379e7Schristos	  fputs (name, fp);
*946379e7Schristos	  if (indent)
*946379e7Schristos	    {
*946379e7Schristos	      if (extra_indent > 0)
*946379e7Schristos		fwrite ("        ", 1, extra_indent, fp);
*946379e7Schristos	      putc ('\t', fp);
*946379e7Schristos	    }
*946379e7Schristos	  else
*946379e7Schristos	    putc (' ', fp);
*946379e7Schristos	  first_line = false;
*946379e7Schristos	}
*946379e7Schristos      else
*946379e7Schristos	{
*946379e7Schristos	  if (indent)
*946379e7Schristos	    {
*946379e7Schristos	      if (extra_indent > 0)
*946379e7Schristos		fwrite ("        ", 1, extra_indent, fp);
*946379e7Schristos	      putc ('\t', fp);
*946379e7Schristos	    }
*946379e7Schristos	}
*946379e7Schristos
*946379e7Schristos      /* Print the portion itself, with linebreaks where necessary.  */
*946379e7Schristos      putc ('"', fp);
*946379e7Schristos      for (i = 0; i < portion_len; i++)
*946379e7Schristos	{
*946379e7Schristos	  if (linebreaks[i] == UC_BREAK_POSSIBLE)
*946379e7Schristos	    {
*946379e7Schristos	      fputs ("\"\n", fp);
*946379e7Schristos	      /* INDENT-S.  */
*946379e7Schristos	      if (line_prefix != NULL)
*946379e7Schristos		fputs (line_prefix, fp);
*946379e7Schristos	      if (indent)
*946379e7Schristos		putc ('\t', fp);
*946379e7Schristos	      putc ('"', fp);
*946379e7Schristos	    }
*946379e7Schristos	  putc (portion[i], fp);
*946379e7Schristos	}
*946379e7Schristos      fputs ("\"\n", fp);
*946379e7Schristos
*946379e7Schristos      free (linebreaks);
*946379e7Schristos      free (overrides);
*946379e7Schristos      free (portion);
*946379e7Schristos
*946379e7Schristos      s = es;
*946379e7Schristos#     undef is_escape
*946379e7Schristos    }
*946379e7Schristos  while (*s);
*946379e7Schristos
*946379e7Schristos#if HAVE_ICONV
*946379e7Schristos  if (conv != (iconv_t)(-1))
*946379e7Schristos    iconv_close (conv);
*946379e7Schristos#endif
*946379e7Schristos}
*946379e7Schristos
*946379e7Schristos
*946379e7Schristosstatic void
*946379e7Schristosprint_blank_line (FILE *fp)
*946379e7Schristos{
*946379e7Schristos  if (uniforum)
*946379e7Schristos    fputs ("#\n", fp);
*946379e7Schristos  else
*946379e7Schristos    putc ('\n', fp);
*946379e7Schristos}
*946379e7Schristos
*946379e7Schristos
*946379e7Schristosstatic void
*946379e7Schristosmessage_print (const message_ty *mp, FILE *fp, const char *charset,
*946379e7Schristos	       size_t page_width, bool blank_line, bool debug)
*946379e7Schristos{
*946379e7Schristos  int extra_indent;
*946379e7Schristos
*946379e7Schristos  /* Separate messages with a blank line.  Uniforum doesn't like blank
*946379e7Schristos     lines, so use an empty comment (unless there already is one).  */
*946379e7Schristos  if (blank_line && (!uniforum
*946379e7Schristos		     || mp->comment == NULL
*946379e7Schristos		     || mp->comment->nitems == 0
*946379e7Schristos		     || mp->comment->item[0][0] != '\0'))
*946379e7Schristos    print_blank_line (fp);
*946379e7Schristos
*946379e7Schristos  /* Print translator comment if available.  */
*946379e7Schristos  message_print_comment (mp, fp);
*946379e7Schristos
*946379e7Schristos  /* Print xgettext extracted comments.  */
*946379e7Schristos  message_print_comment_dot (mp, fp);
*946379e7Schristos
*946379e7Schristos  /* Print the file position comments.  This will help a human who is
*946379e7Schristos     trying to navigate the sources.  There is no problem of getting
*946379e7Schristos     repeated positions, because duplicates are checked for.  */
*946379e7Schristos  message_print_comment_filepos (mp, fp, uniforum, page_width);
*946379e7Schristos
*946379e7Schristos  /* Print flag information in special comment.  */
*946379e7Schristos  message_print_comment_flags (mp, fp, debug);
*946379e7Schristos
*946379e7Schristos  /* Print the previous msgid.  This helps the translator when the msgid has
*946379e7Schristos     only slightly changed.  */
*946379e7Schristos  if (mp->prev_msgctxt != NULL)
*946379e7Schristos    wrap (mp, fp, "#| ", 0, "msgctxt", mp->prev_msgctxt, mp->do_wrap,
*946379e7Schristos	  page_width, charset);
*946379e7Schristos  if (mp->prev_msgid != NULL)
*946379e7Schristos    wrap (mp, fp, "#| ", 0, "msgid", mp->prev_msgid, mp->do_wrap, page_width,
*946379e7Schristos	  charset);
*946379e7Schristos  if (mp->prev_msgid_plural != NULL)
*946379e7Schristos    wrap (mp, fp, "#| ", 0, "msgid_plural", mp->prev_msgid_plural, mp->do_wrap,
*946379e7Schristos	  page_width, charset);
*946379e7Schristos  extra_indent = (mp->prev_msgctxt != NULL || mp->prev_msgid != NULL
*946379e7Schristos		  || mp->prev_msgid_plural != NULL
*946379e7Schristos		  ? 3
*946379e7Schristos		  : 0);
*946379e7Schristos
*946379e7Schristos  /* Print each of the message components.  Wrap them nicely so they
*946379e7Schristos     are as readable as possible.  If there is no recorded msgstr for
*946379e7Schristos     this domain, emit an empty string.  */
*946379e7Schristos  if (mp->msgctxt != NULL && !is_ascii_string (mp->msgctxt)
*946379e7Schristos      && po_charset_canonicalize (charset) != po_charset_utf8)
*946379e7Schristos    {
*946379e7Schristos      char *warning_message =
*946379e7Schristos	xasprintf (_("\
*946379e7SchristosThe following msgctxt contains non-ASCII characters.\n\
*946379e7SchristosThis will cause problems to translators who use a character encoding\n\
*946379e7Schristosdifferent from yours. Consider using a pure ASCII msgctxt instead.\n\
*946379e7Schristos%s\n"), mp->msgctxt);
*946379e7Schristos      po_xerror (PO_SEVERITY_WARNING, mp, NULL, 0, 0, true, warning_message);
*946379e7Schristos      free (warning_message);
*946379e7Schristos    }
*946379e7Schristos  if (!is_ascii_string (mp->msgid)
*946379e7Schristos      && po_charset_canonicalize (charset) != po_charset_utf8)
*946379e7Schristos    {
*946379e7Schristos      char *warning_message =
*946379e7Schristos	xasprintf (_("\
*946379e7SchristosThe following msgid contains non-ASCII characters.\n\
*946379e7SchristosThis will cause problems to translators who use a character encoding\n\
*946379e7Schristosdifferent from yours. Consider using a pure ASCII msgid instead.\n\
*946379e7Schristos%s\n"), mp->msgid);
*946379e7Schristos      po_xerror (PO_SEVERITY_WARNING, mp, NULL, 0, 0, true, warning_message);
*946379e7Schristos      free (warning_message);
*946379e7Schristos    }
*946379e7Schristos  if (mp->msgctxt != NULL)
*946379e7Schristos    wrap (mp, fp, NULL, extra_indent, "msgctxt", mp->msgctxt, mp->do_wrap,
*946379e7Schristos	  page_width, charset);
*946379e7Schristos  wrap (mp, fp, NULL, extra_indent, "msgid", mp->msgid, mp->do_wrap,
*946379e7Schristos	  page_width, charset);
*946379e7Schristos  if (mp->msgid_plural != NULL)
*946379e7Schristos    wrap (mp, fp, NULL, extra_indent, "msgid_plural", mp->msgid_plural,
*946379e7Schristos	  mp->do_wrap, page_width, charset);
*946379e7Schristos
*946379e7Schristos  if (mp->msgid_plural == NULL)
*946379e7Schristos    wrap (mp, fp, NULL, extra_indent, "msgstr", mp->msgstr, mp->do_wrap,
*946379e7Schristos	  page_width, charset);
*946379e7Schristos  else
*946379e7Schristos    {
*946379e7Schristos      char prefix_buf[20];
*946379e7Schristos      unsigned int i;
*946379e7Schristos      const char *p;
*946379e7Schristos
*946379e7Schristos      for (p = mp->msgstr, i = 0;
*946379e7Schristos	   p < mp->msgstr + mp->msgstr_len;
*946379e7Schristos	   p += strlen (p) + 1, i++)
*946379e7Schristos	{
*946379e7Schristos	  sprintf (prefix_buf, "msgstr[%u]", i);
*946379e7Schristos	  wrap (mp, fp, NULL, extra_indent, prefix_buf, p, mp->do_wrap,
*946379e7Schristos		page_width, charset);
*946379e7Schristos	}
*946379e7Schristos    }
*946379e7Schristos}
*946379e7Schristos
*946379e7Schristos
*946379e7Schristosstatic void
*946379e7Schristosmessage_print_obsolete (const message_ty *mp, FILE *fp, const char *charset,
*946379e7Schristos			size_t page_width, bool blank_line)
*946379e7Schristos{
*946379e7Schristos  int extra_indent;
*946379e7Schristos
*946379e7Schristos  /* If msgstr is the empty string we print nothing.  */
*946379e7Schristos  if (mp->msgstr[0] == '\0')
*946379e7Schristos    return;
*946379e7Schristos
*946379e7Schristos  /* Separate messages with a blank line.  Uniforum doesn't like blank
*946379e7Schristos     lines, so use an empty comment (unless there already is one).  */
*946379e7Schristos  if (blank_line)
*946379e7Schristos    print_blank_line (fp);
*946379e7Schristos
*946379e7Schristos  /* Print translator comment if available.  */
*946379e7Schristos  message_print_comment (mp, fp);
*946379e7Schristos
*946379e7Schristos  /* Print xgettext extracted comments (normally empty).  */
*946379e7Schristos  message_print_comment_dot (mp, fp);
*946379e7Schristos
*946379e7Schristos  /* Print the file position comments (normally empty).  */
*946379e7Schristos  message_print_comment_filepos (mp, fp, uniforum, page_width);
*946379e7Schristos
*946379e7Schristos  /* Print flag information in special comment.  */
*946379e7Schristos  if (mp->is_fuzzy)
*946379e7Schristos    {
*946379e7Schristos      bool first = true;
*946379e7Schristos
*946379e7Schristos      putc ('#', fp);
*946379e7Schristos      putc (',', fp);
*946379e7Schristos
*946379e7Schristos      if (mp->is_fuzzy)
*946379e7Schristos	{
*946379e7Schristos	  fputs (" fuzzy", fp);
*946379e7Schristos	  first = false;
*946379e7Schristos	}
*946379e7Schristos
*946379e7Schristos      putc ('\n', fp);
*946379e7Schristos    }
*946379e7Schristos
*946379e7Schristos  /* Print the previous msgid.  This helps the translator when the msgid has
*946379e7Schristos     only slightly changed.  */
*946379e7Schristos  if (mp->prev_msgctxt != NULL)
*946379e7Schristos    wrap (mp, fp, "#~| ", 0, "msgctxt", mp->prev_msgctxt, mp->do_wrap,
*946379e7Schristos	  page_width, charset);
*946379e7Schristos  if (mp->prev_msgid != NULL)
*946379e7Schristos    wrap (mp, fp, "#~| ", 0, "msgid", mp->prev_msgid, mp->do_wrap, page_width,
*946379e7Schristos	  charset);
*946379e7Schristos  if (mp->prev_msgid_plural != NULL)
*946379e7Schristos    wrap (mp, fp, "#~| ", 0, "msgid_plural", mp->prev_msgid_plural, mp->do_wrap,
*946379e7Schristos	  page_width, charset);
*946379e7Schristos  extra_indent = (mp->prev_msgctxt != NULL || mp->prev_msgid != NULL
*946379e7Schristos		  || mp->prev_msgid_plural != NULL
*946379e7Schristos		  ? 1
*946379e7Schristos		  : 0);
*946379e7Schristos
*946379e7Schristos  /* Print each of the message components.  Wrap them nicely so they
*946379e7Schristos     are as readable as possible.  */
*946379e7Schristos  if (mp->msgctxt != NULL && !is_ascii_string (mp->msgctxt)
*946379e7Schristos      && po_charset_canonicalize (charset) != po_charset_utf8)
*946379e7Schristos    {
*946379e7Schristos      char *warning_message =
*946379e7Schristos	xasprintf (_("\
*946379e7SchristosThe following msgctxt contains non-ASCII characters.\n\
*946379e7SchristosThis will cause problems to translators who use a character encoding\n\
*946379e7Schristosdifferent from yours. Consider using a pure ASCII msgctxt instead.\n\
*946379e7Schristos%s\n"), mp->msgctxt);
*946379e7Schristos      po_xerror (PO_SEVERITY_WARNING, mp, NULL, 0, 0, true, warning_message);
*946379e7Schristos      free (warning_message);
*946379e7Schristos    }
*946379e7Schristos  if (!is_ascii_string (mp->msgid)
*946379e7Schristos      && po_charset_canonicalize (charset) != po_charset_utf8)
*946379e7Schristos    {
*946379e7Schristos      char *warning_message =
*946379e7Schristos	xasprintf (_("\
*946379e7SchristosThe following msgid contains non-ASCII characters.\n\
*946379e7SchristosThis will cause problems to translators who use a character encoding\n\
*946379e7Schristosdifferent from yours. Consider using a pure ASCII msgid instead.\n\
*946379e7Schristos%s\n"), mp->msgid);
*946379e7Schristos      po_xerror (PO_SEVERITY_WARNING, mp, NULL, 0, 0, true, warning_message);
*946379e7Schristos      free (warning_message);
*946379e7Schristos    }
*946379e7Schristos  if (mp->msgctxt != NULL)
*946379e7Schristos    wrap (mp, fp, "#~ ", extra_indent, "msgctxt", mp->msgctxt, mp->do_wrap,
*946379e7Schristos	  page_width, charset);
*946379e7Schristos  wrap (mp, fp, "#~ ", extra_indent, "msgid", mp->msgid, mp->do_wrap,
*946379e7Schristos	page_width, charset);
*946379e7Schristos  if (mp->msgid_plural != NULL)
*946379e7Schristos    wrap (mp, fp, "#~ ", extra_indent, "msgid_plural", mp->msgid_plural,
*946379e7Schristos	  mp->do_wrap, page_width, charset);
*946379e7Schristos
*946379e7Schristos  if (mp->msgid_plural == NULL)
*946379e7Schristos    wrap (mp, fp, "#~ ", extra_indent, "msgstr", mp->msgstr, mp->do_wrap,
*946379e7Schristos	  page_width, charset);
*946379e7Schristos  else
*946379e7Schristos    {
*946379e7Schristos      char prefix_buf[20];
*946379e7Schristos      unsigned int i;
*946379e7Schristos      const char *p;
*946379e7Schristos
*946379e7Schristos      for (p = mp->msgstr, i = 0;
*946379e7Schristos	   p < mp->msgstr + mp->msgstr_len;
*946379e7Schristos	   p += strlen (p) + 1, i++)
*946379e7Schristos	{
*946379e7Schristos	  sprintf (prefix_buf, "msgstr[%u]", i);
*946379e7Schristos	  wrap (mp, fp, "#~ ", extra_indent, prefix_buf, p, mp->do_wrap,
*946379e7Schristos		page_width, charset);
*946379e7Schristos	}
*946379e7Schristos    }
*946379e7Schristos}
*946379e7Schristos
*946379e7Schristos
*946379e7Schristosstatic void
*946379e7Schristosmsgdomain_list_print_po (msgdomain_list_ty *mdlp, FILE *fp, size_t page_width,
*946379e7Schristos			 bool debug)
*946379e7Schristos{
*946379e7Schristos  size_t j, k;
*946379e7Schristos  bool blank_line;
*946379e7Schristos
*946379e7Schristos  /* Write out the messages for each domain.  */
*946379e7Schristos  blank_line = false;
*946379e7Schristos  for (k = 0; k < mdlp->nitems; k++)
*946379e7Schristos    {
*946379e7Schristos      message_list_ty *mlp;
*946379e7Schristos      const char *header;
*946379e7Schristos      const char *charset;
*946379e7Schristos      char *allocated_charset;
*946379e7Schristos
*946379e7Schristos      /* If the first domain is the default, don't bother emitting
*946379e7Schristos	 the domain name, because it is the default.  */
*946379e7Schristos      if (!(k == 0
*946379e7Schristos	    && strcmp (mdlp->item[k]->domain, MESSAGE_DOMAIN_DEFAULT) == 0))
*946379e7Schristos	{
*946379e7Schristos	  if (blank_line)
*946379e7Schristos	    print_blank_line (fp);
*946379e7Schristos	  fprintf (fp, "domain \"%s\"\n", mdlp->item[k]->domain);
*946379e7Schristos	  blank_line = true;
*946379e7Schristos	}
*946379e7Schristos
*946379e7Schristos      mlp = mdlp->item[k]->messages;
*946379e7Schristos
*946379e7Schristos      /* Search the header entry.  */
*946379e7Schristos      header = NULL;
*946379e7Schristos      for (j = 0; j < mlp->nitems; ++j)
*946379e7Schristos	if (is_header (mlp->item[j]) && !mlp->item[j]->obsolete)
*946379e7Schristos	  {
*946379e7Schristos	    header = mlp->item[j]->msgstr;
*946379e7Schristos	    break;
*946379e7Schristos	  }
*946379e7Schristos
*946379e7Schristos      /* Extract the charset name.  */
*946379e7Schristos      charset = "ASCII";
*946379e7Schristos      allocated_charset = NULL;
*946379e7Schristos      if (header != NULL)
*946379e7Schristos	{
*946379e7Schristos	  const char *charsetstr = c_strstr (header, "charset=");
*946379e7Schristos
*946379e7Schristos	  if (charsetstr != NULL)
*946379e7Schristos	    {
*946379e7Schristos	      size_t len;
*946379e7Schristos
*946379e7Schristos	      charsetstr += strlen ("charset=");
*946379e7Schristos	      len = strcspn (charsetstr, " \t\n");
*946379e7Schristos	      allocated_charset = (char *) xallocsa (len + 1);
*946379e7Schristos	      memcpy (allocated_charset, charsetstr, len);
*946379e7Schristos	      allocated_charset[len] = '\0';
*946379e7Schristos	      charset = allocated_charset;
*946379e7Schristos
*946379e7Schristos	      /* Treat the dummy default value as if it were absent.  */
*946379e7Schristos	      if (strcmp (charset, "CHARSET") == 0)
*946379e7Schristos		charset = "ASCII";
*946379e7Schristos	    }
*946379e7Schristos	}
*946379e7Schristos
*946379e7Schristos      /* Write out each of the messages for this domain.  */
*946379e7Schristos      for (j = 0; j < mlp->nitems; ++j)
*946379e7Schristos	if (!mlp->item[j]->obsolete)
*946379e7Schristos	  {
*946379e7Schristos	    message_print (mlp->item[j], fp, charset, page_width, blank_line,
*946379e7Schristos			   debug);
*946379e7Schristos	    blank_line = true;
*946379e7Schristos	  }
*946379e7Schristos
*946379e7Schristos      /* Write out each of the obsolete messages for this domain.  */
*946379e7Schristos      for (j = 0; j < mlp->nitems; ++j)
*946379e7Schristos	if (mlp->item[j]->obsolete)
*946379e7Schristos	  {
*946379e7Schristos	    message_print_obsolete (mlp->item[j], fp, charset, page_width,
*946379e7Schristos				    blank_line);
*946379e7Schristos	    blank_line = true;
*946379e7Schristos	  }
*946379e7Schristos
*946379e7Schristos      if (allocated_charset != NULL)
*946379e7Schristos	freesa (allocated_charset);
*946379e7Schristos    }
*946379e7Schristos}
*946379e7Schristos
*946379e7Schristos
*946379e7Schristos/* Describes a PO file in .po syntax.  */
*946379e7Schristosconst struct catalog_output_format output_format_po =
*946379e7Schristos{
*946379e7Schristos  msgdomain_list_print_po,		/* print */
*946379e7Schristos  false,				/* requires_utf8 */
*946379e7Schristos  true,					/* supports_multiple_domains */
*946379e7Schristos  true,					/* supports_contexts */
*946379e7Schristos  true,					/* supports_plurals */
*946379e7Schristos  false,				/* alternative_is_po */
*946379e7Schristos  false					/* alternative_is_java_class */
*946379e7Schristos};