freeswitch/libs/sofia-sip/libsofia-sip-ua/ipt/ucs2.c

/*
 * This file is part of the Sofia-SIP package
 *
 * Copyright (C) 2005 Nokia Corporation.
 *
 * Contact: Pekka Pessi <pekka.pessi@nokia.com>
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public License
 * as published by the Free Software Foundation; either version 2.1 of
 * the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
 * 02110-1301 USA
 *
 */

/**@CFILE ucs2.c UCS2 (Unicode, ISO Basic Multilingual Plane) string handling.
 *
 * @author Pekka Pessi <Pekka.Pessi@nokia.com>
 *
 * @date Created: Tue Apr 21 15:32:02 1998 pessi
 *
 */

#include "config.h"

#include <sofia-sip/utf8.h>
#include "utf8internal.h"

/*
 * Decode utf8 string into ucs2 string,
 * return number of ucs2 characters decoded.
 *
 * At most dst_size characters are stored in dst.  A terminating zero is
 * appended only when there is still room for it after the last decoded
 * character, so the result is NOT terminated when the output fills dst
 * completely.  A byte that does not start a sequence accepted by
 * IS_UTF8_S1(), IS_UTF8_S2() or IS_UTF8_S3() is skipped.
 *
 * A NULL or empty s decodes to zero characters.
 */
size_t ucs2decode(ucs2 *dst, size_t dst_size, const utf8 *s)
{
  ucs2 v, *d = dst;

  /*
   * Check for the terminator before decoding anything: every branch in
   * the body advances s by at least one byte, so entering the body on an
   * empty string would step over the final zero and then read beyond the
   * end of the input.
   */
  if (s) while (*s) {
    if (dst_size == 0)
      break;			/* output buffer is full */
    if (IS_UTF8_S1(s))
      v = UCS4_S1(s), s += 1;
    else if (IS_UTF8_S2(s))
      v = UCS4_S2(s), s += 2;
    else if (IS_UTF8_S3(s))
      v = UCS4_S3(s), s += 3;
    else {
      s++;
      continue;			/* skip illegal characters */
    }
    *d++ = v;
    dst_size--;
  }

  /* Terminate the result only if a free slot is left */
  if (dst_size)
    *d = 0;

  return d - dst;
}

/*
 * Encode at most n ucs2 characters from s into dst as utf8,
 * return number of utf8 bytes written including the final zero.
 *
 * 'quote' is an optional table indexed by ASCII code; a non-zero entry
 * makes that character be written in the two-byte form instead of as a
 * single byte.
 *
 * Encoding stops early at a zero character unless the quote table marks
 * zero as quoted.  The caller has to provide a large enough dst; no
 * bound is checked here (ucs2enclen() gives the required size).
 */
size_t ucs2encode(utf8 *dst, const ucs2 *s, size_t n, const char quote[128])
{
  utf8 *out = dst;
  size_t i;

  if (s) {
    for (i = 0; i < n; i++) {
      ucs2 ch = s[i];

      if (!IS_UCS4_1(ch)) {
        /* Outside the one-byte range: two- or three-byte sequence */
        if (IS_UCS4_2(ch)) {
          UTF8_S2(out, ch);
          out += 2;
        }
        else /* if (IS_UCS4_3(ch)) */ {
          UTF8_S3(out, ch);
          out += 3;
        }
        continue;
      }

      if (quote && quote[ch]) {
        /* Quoted ASCII character is written in the two-byte form */
        UTF8_S2(out, ch);
        out += 2;
        continue;
      }

      if (ch == 0)		/* unquoted zero ends the input */
        break;

      UTF8_S1(out, (utf8) ch);
      out += 1;
    }
  }

  *out++ = 0;

  return out - dst;
}

/*
 * Length of UCS2 (BMP, Unicode) string decoded from UTF8.
 *
 * The counting is done by UTF8_ANALYZE(): one variable is passed for
 * its first three counter arguments and another for the remaining two.
 * Returns 0 if the second one ends up non-zero.
 *
 * NOTE(review): the exact meaning of each UTF8_ANALYZE() argument is
 * defined in utf8internal.h, not here -- confirm there.
 */
size_t ucs2declen(const utf8 *s)
{
  size_t nchars = 0;
  size_t nerrors = 0;

  UTF8_ANALYZE(s, nchars, nchars, nchars, nerrors, nerrors);

  return nerrors ? 0 : nchars;
}

/*
 * Length of UTF8 encoding of a UCS2 string, including final zero.
 *
 * Examines at most n characters of s and stops early at a zero
 * character unless the optional 'quote' table marks zero as quoted.
 * A quoted ASCII character counts as two bytes, matching the two-byte
 * form that ucs2encode() writes for it.
 *
 * A NULL s yields 1 (just the final zero), the same as ucs2encode()
 * returns for a NULL source.
 */
size_t ucs2enclen(const ucs2 *s, size_t n, const char quote[128])
{
  size_t len = 1;		/* room for the final zero */
  ucs2 c;

  if (s) while (n-- > 0) {
    c = *s++;
    if (c < 0x80u) {
      if (quote && quote[c]) {
        len += 2;
      }
      else {
        if (!c)			/* unquoted zero ends the string */
          break;
        len += 1;
      }
    }
    else if (c < 0x800u) {
      len += 2;
    }
    else /* if (c < 0x10000u) */ {
      len += 3;
    }
  }

  return len;
}

/*
 * Length of UCS2 string: the number of characters preceding the first
 * zero character.  A NULL string has length 0.
 */
size_t ucs2len(ucs2 const *s)
{
  ucs2 const *end;

  if (!s)
    return 0;

  /* Walk to the terminating zero */
  for (end = s; *end; end++)
    ;

  return end - s;
}

/*
 * Compare two zero-terminated UCS2 (BMP, Unicode) strings.
 *
 * Returns zero if the strings are equal, otherwise the difference
 * (*s1 - *s2) of the first pair of characters that differ: negative
 * when s1 sorts first, positive when s2 sorts first.
 *
 * A NULL string sorts before any non-NULL string and two NULL strings
 * compare equal.
 */
int ucs2cmp(ucs2 const *s1, ucs2 const *s2)
{
  int retval;

  /*
   * Settle the NULL cases without subtracting the pointers: they do not
   * point into the same array, and their difference need not fit an int.
   */
  if (s1 == s2)
    return 0;
  if (!s1)
    return -1;
  if (!s2)
    return 1;

  /*
   * Advance while the characters are equal and the end has not been
   * reached; when they are equal, testing *s1 alone covers both strings.
   */
  while ((retval = (int)*s1 - (int)*s2) == 0 && *s1) {
    s1++;
    s2++;
  }

  return retval;
}

/*
 * Compare at most n characters of two UCS2 (BMP, Unicode) strings.
 *
 * Returns zero if the first n characters (or the whole strings, when
 * they end sooner) are equal, otherwise the difference (*s1 - *s2) of
 * the first pair of characters that differ.
 *
 * Returns zero when n is 0 or when either string is NULL.
 */
int ucs2ncmp(ucs2 const *s1, ucs2 const *s2, size_t n)
{
  int retval = 0;

  if (s1 && s2) {
    /*
     * Advance while there are characters left to compare, the current
     * pair is equal and the end has not been reached; when the pair is
     * equal, testing *s1 alone covers both strings.
     */
    while (n-- > 0 && (retval = (int)*s1 - (int)*s2) == 0 && *s1) {
      s1++;
      s2++;
    }
  }

  return retval;
}
add sofia-sip 1.12.4 (plus some patches through 12/21/2006) to in tree libs git-svn-id: http://svn.freeswitch.org/svn/freeswitch/trunk@3774 d0543943-73ff-0310-b7d9-9358b9ac24b2 2006-12-21 01:30:28 -05:00			`/*`
			`* This file is part of the Sofia-SIP package`
			`*`
			`* Copyright (C) 2005 Nokia Corporation.`
			`*`
			`* Contact: Pekka Pessi <pekka.pessi@nokia.com>`
			`*`
			`* This library is free software; you can redistribute it and/or`
			`* modify it under the terms of the GNU Lesser General Public License`
			`* as published by the Free Software Foundation; either version 2.1 of`
			`* the License, or (at your option) any later version.`
			`*`
			`* This library is distributed in the hope that it will be useful, but`
			`* WITHOUT ANY WARRANTY; without even the implied warranty of`
			`* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU`
			`* Lesser General Public License for more details.`
			`*`
			`* You should have received a copy of the GNU Lesser General Public`
			`* License along with this library; if not, write to the Free Software`
			`* Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA`
			`* 02110-1301 USA`
			`*`
			`*/`

			`/**@CFILE ucs2.c UCS2 (Unicode, ISO Basic Multilingual Plane) string handling.`
			`*`
			`* @author Pekka Pessi <Pekka.Pessi@nokia.com>`
			`*`
			`* @date Created: Tue Apr 21 15:32:02 1998 pessi`
			`*`
			`*/`

			`#include "config.h"`

			`#include <sofia-sip/utf8.h>`
			`#include "utf8internal.h"`

			`/*`
merge whitespace fixes from sofia-sip tree git-svn-id: http://svn.freeswitch.org/svn/freeswitch/trunk@10802 d0543943-73ff-0310-b7d9-9358b9ac24b2 2008-12-16 13:05:22 -05:00			`* Decode utf8 string into ucs2 string,`
add sofia-sip 1.12.4 (plus some patches through 12/21/2006) to in tree libs git-svn-id: http://svn.freeswitch.org/svn/freeswitch/trunk@3774 d0543943-73ff-0310-b7d9-9358b9ac24b2 2006-12-21 01:30:28 -05:00			`* return number of ucs2 characters decoded`
			`*/`
			`size_t ucs2decode(ucs2 dst, size_t dst_size, const utf8 s)`
			`{`
			`ucs2 v, *d = dst;`

			`if (s) do {`
			`if (dst_size == 0)`
			`break;`
			`if (IS_UTF8_S1(s))`
			`v = UCS4_S1(s), s += 1;`
			`else if (IS_UTF8_S2(s))`
			`v = UCS4_S2(s), s += 2;`
			`else if (IS_UTF8_S3(s))`
			`v = UCS4_S3(s), s += 3;`
			`else {`
			`s++;`
			`continue; /* skip illegal characters */`
			`}`
			`*d++ = v;`
			`dst_size--;`
			`} while (*s);`

			`if (dst_size)`
			`*d = 0;`

			`return d - dst;`
			`}`

			`/*`
			`* Encode ucs2 string into utf8 string,`
			`* return number of utf8 bytes encoded including final zero`
			`*`
merge whitespace fixes from sofia-sip tree git-svn-id: http://svn.freeswitch.org/svn/freeswitch/trunk@10802 d0543943-73ff-0310-b7d9-9358b9ac24b2 2008-12-16 13:05:22 -05:00			`* 'quote' may contain an optional quoting table containing`
add sofia-sip 1.12.4 (plus some patches through 12/21/2006) to in tree libs git-svn-id: http://svn.freeswitch.org/svn/freeswitch/trunk@3774 d0543943-73ff-0310-b7d9-9358b9ac24b2 2006-12-21 01:30:28 -05:00			`* non-zero for all ASCII characters to quote`
merge whitespace fixes from sofia-sip tree git-svn-id: http://svn.freeswitch.org/svn/freeswitch/trunk@10802 d0543943-73ff-0310-b7d9-9358b9ac24b2 2008-12-16 13:05:22 -05:00			`*`
add sofia-sip 1.12.4 (plus some patches through 12/21/2006) to in tree libs git-svn-id: http://svn.freeswitch.org/svn/freeswitch/trunk@3774 d0543943-73ff-0310-b7d9-9358b9ac24b2 2006-12-21 01:30:28 -05:00			`*/`
			`size_t ucs2encode(utf8 dst, const ucs2 s, size_t n, const char quote[128])`
			`{`
			`utf8 *d = dst;`
			`ucs2 c;`

			`if (s) while (n-- > 0) {`
			`c = *s++;`

			`if (IS_UCS4_1(c)) {`
			`if (quote && quote[c]) {`
			`UTF8_S2(d, c);`
			`d += 2;`
			`}`
			`else {`
			`if (!c) /* zero must be represented as UTF8_2 */`
			`break;`
			`UTF8_S1(d, (utf8) c);`
			`d += 1;`
			`}`
			`}`
			`else if (IS_UCS4_2(c)) {`
			`UTF8_S2(d, c);`
			`d += 2;`
			`}`
			`else /* if (IS_UCS4_3(c)) */ {`
			`UTF8_S3(d, c);`
			`d += 3;`
			`}`
			`}`

			`*d++ = 0;`
			`return d - dst;`
			`}`

			`/*`
			`* Length of UCS2 (BMP, Unicode) string decoded from UTF8`
			`*/`
			`size_t ucs2declen(const utf8 *s)`
			`{`
			`size_t len = 0;`
			`size_t errors = 0; /* errors */`

			`UTF8_ANALYZE(s, len, len, len, errors, errors);`

			`if (errors)`
			`return 0;`

			`return len;`
			`}`

			`/*`
			`* Length of UTF8 encoding of a UCS2 string, including final zero`
			`*/`
			`size_t ucs2enclen(const ucs2 *s, size_t n, const char quote[128])`
			`{`
			`size_t len = 1;`
			`ucs2 c;`
merge whitespace fixes from sofia-sip tree git-svn-id: http://svn.freeswitch.org/svn/freeswitch/trunk@10802 d0543943-73ff-0310-b7d9-9358b9ac24b2 2008-12-16 13:05:22 -05:00
add sofia-sip 1.12.4 (plus some patches through 12/21/2006) to in tree libs git-svn-id: http://svn.freeswitch.org/svn/freeswitch/trunk@3774 d0543943-73ff-0310-b7d9-9358b9ac24b2 2006-12-21 01:30:28 -05:00			`while (n-- > 0) {`
			`c = *s++;`
			`if (c < 0x80u)`
			`if (quote && quote[c])`
			`len += 2;`
			`else {`
			`if (!c) break;`
			`len += 1;`
			`}`
			`else if (c < 0x800u)`
			`len += 2;`
			`else /* if (c < 0x10000u) */`
			`len += 3;`
			`}`

			`return len;`
			`}`

			`/*`
			`* Length of UCS2 string (number of non-zero UCS2 characters before zero)`
			`*/`
			`size_t ucs2len(ucs2 const *s)`
			`{`
			`size_t len = 0;`

merge whitespace fixes from sofia-sip tree git-svn-id: http://svn.freeswitch.org/svn/freeswitch/trunk@10802 d0543943-73ff-0310-b7d9-9358b9ac24b2 2008-12-16 13:05:22 -05:00			`if (s) while (*s++)`
add sofia-sip 1.12.4 (plus some patches through 12/21/2006) to in tree libs git-svn-id: http://svn.freeswitch.org/svn/freeswitch/trunk@3774 d0543943-73ff-0310-b7d9-9358b9ac24b2 2006-12-21 01:30:28 -05:00			`len++;`

			`return len;`
			`}`

			`/*`
			`* Compare UCS2 (BMP, Unicode) string`
			`*/`
			`int ucs2cmp(ucs2 const s1, ucs2 const s2)`
			`{`
			`int retval = s1 - s2;`

merge whitespace fixes from sofia-sip tree git-svn-id: http://svn.freeswitch.org/svn/freeswitch/trunk@10802 d0543943-73ff-0310-b7d9-9358b9ac24b2 2008-12-16 13:05:22 -05:00			`if (s1 && s2)`
add sofia-sip 1.12.4 (plus some patches through 12/21/2006) to in tree libs git-svn-id: http://svn.freeswitch.org/svn/freeswitch/trunk@3774 d0543943-73ff-0310-b7d9-9358b9ac24b2 2006-12-21 01:30:28 -05:00			`while ((retval = (s1 - s2)) && (s1++) && (s2++))`
			`;`

			`return retval;`
			`}`

			`/*`
			`* Compare UCS2 (BMP, Unicode) string`
			`*/`
			`int ucs2ncmp(ucs2 const s1, ucs2 const s2, size_t n)`
			`{`
			`int retval = 0;`

merge whitespace fixes from sofia-sip tree git-svn-id: http://svn.freeswitch.org/svn/freeswitch/trunk@10802 d0543943-73ff-0310-b7d9-9358b9ac24b2 2008-12-16 13:05:22 -05:00			`if (s1 && s2)`
add sofia-sip 1.12.4 (plus some patches through 12/21/2006) to in tree libs git-svn-id: http://svn.freeswitch.org/svn/freeswitch/trunk@3774 d0543943-73ff-0310-b7d9-9358b9ac24b2 2006-12-21 01:30:28 -05:00			`while (n-- > 0 && (retval = (s1 - s2)) && (s1++) && (s2++))`
			`;`

			`return retval;`
			`}`