Blame inet/idna_name_classify.c

Packit 6c4009
/* Classify a domain name for IDNA purposes.
Packit 6c4009
   Copyright (C) 2018 Free Software Foundation, Inc.
Packit 6c4009
   This file is part of the GNU C Library.
Packit 6c4009
Packit 6c4009
   The GNU C Library is free software; you can redistribute it and/or
Packit 6c4009
   modify it under the terms of the GNU Lesser General Public
Packit 6c4009
   License as published by the Free Software Foundation; either
Packit 6c4009
   version 2.1 of the License, or (at your option) any later version.
Packit 6c4009
Packit 6c4009
   The GNU C Library is distributed in the hope that it will be useful,
Packit 6c4009
   but WITHOUT ANY WARRANTY; without even the implied warranty of
Packit 6c4009
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
Packit 6c4009
   Lesser General Public License for more details.
Packit 6c4009
Packit 6c4009
   You should have received a copy of the GNU Lesser General Public
Packit 6c4009
   License along with the GNU C Library; if not, see
Packit 6c4009
   <http://www.gnu.org/licenses/>.  */
Packit 6c4009
Packit 6c4009
#include <errno.h>
Packit 6c4009
#include <inet/net-internal.h>
Packit 6c4009
#include <stdbool.h>
Packit 6c4009
#include <string.h>
Packit 6c4009
#include <wchar.h>
Packit 6c4009
Packit 6c4009
enum idna_name_classification
Packit 6c4009
__idna_name_classify (const char *name)
Packit 6c4009
{
Packit 6c4009
  mbstate_t mbs;
Packit 6c4009
  memset (&mbs, 0, sizeof (mbs));
Packit 6c4009
  const char *p = name;
Packit 6c4009
  const char *end = p + strlen (p) + 1;
Packit 6c4009
  bool nonascii = false;
Packit 6c4009
  bool backslash = false;
Packit 6c4009
  while (true)
Packit 6c4009
    {
Packit 6c4009
      wchar_t wc;
Packit 6c4009
      size_t result = mbrtowc (&wc, p, end - p, &mbs);
Packit 6c4009
      if (result == 0)
Packit 6c4009
        /* NUL terminator was reached.  */
Packit 6c4009
        break;
Packit 6c4009
      else if (result == (size_t) -2)
Packit 6c4009
        /* Incomplete trailing multi-byte character.  This is an
Packit 6c4009
           encoding error becaue we received the full name.  */
Packit 6c4009
        return idna_name_encoding_error;
Packit 6c4009
      else if (result == (size_t) -1)
Packit 6c4009
        {
Packit 6c4009
          /* Other error, including EILSEQ.  */
Packit 6c4009
          if (errno == EILSEQ)
Packit 6c4009
            return idna_name_encoding_error;
Packit 6c4009
          else if (errno == ENOMEM)
Packit 6c4009
            return idna_name_memory_error;
Packit 6c4009
          else
Packit 6c4009
            return idna_name_error;
Packit 6c4009
        }
Packit 6c4009
      else
Packit 6c4009
        {
Packit 6c4009
          /* A wide character was decoded.  */
Packit 6c4009
          p += result;
Packit 6c4009
          if (wc == L'\\')
Packit 6c4009
            backslash = true;
Packit 6c4009
          else if (wc > 127)
Packit 6c4009
            nonascii = true;
Packit 6c4009
        }
Packit 6c4009
    }
Packit 6c4009
Packit 6c4009
  if (nonascii)
Packit 6c4009
    {
Packit 6c4009
      if (backslash)
Packit 6c4009
        return idna_name_nonascii_backslash;
Packit 6c4009
      else
Packit 6c4009
        return idna_name_nonascii;
Packit 6c4009
    }
Packit 6c4009
  else
Packit 6c4009
    return idna_name_ascii;
Packit 6c4009
}