128 lines
3.9 KiB
C
128 lines
3.9 KiB
C
#ifndef lint
|
|
static char *rcsid = "$Id: selectiveencode.c,v 1.1 2003/06/04 00:27:07 marka Exp $";
|
|
#endif
|
|
|
|
/*
|
|
* Copyright (c) 2000,2002 Japan Network Information Center.
|
|
* All rights reserved.
|
|
*
|
|
* By using this file, you agree to the terms and conditions set forth bellow.
|
|
*
|
|
* LICENSE TERMS AND CONDITIONS
|
|
*
|
|
* The following License Terms and Conditions apply, unless a different
|
|
* license is obtained from Japan Network Information Center ("JPNIC"),
|
|
* a Japanese association, Kokusai-Kougyou-Kanda Bldg 6F, 2-3-4 Uchi-Kanda,
|
|
* Chiyoda-ku, Tokyo 101-0047, Japan.
|
|
*
|
|
* 1. Use, Modification and Redistribution (including distribution of any
|
|
* modified or derived work) in source and/or binary forms is permitted
|
|
* under this License Terms and Conditions.
|
|
*
|
|
* 2. Redistribution of source code must retain the copyright notices as they
|
|
* appear in each source code file, this License Terms and Conditions.
|
|
*
|
|
* 3. Redistribution in binary form must reproduce the Copyright Notice,
|
|
* this License Terms and Conditions, in the documentation and/or other
|
|
* materials provided with the distribution. For the purposes of binary
|
|
* distribution the "Copyright Notice" refers to the following language:
|
|
* "Copyright (c) 2000-2002 Japan Network Information Center. All rights reserved."
|
|
*
|
|
* 4. The name of JPNIC may not be used to endorse or promote products
|
|
* derived from this Software without specific prior written approval of
|
|
* JPNIC.
|
|
*
|
|
* 5. Disclaimer/Limitation of Liability: THIS SOFTWARE IS PROVIDED BY JPNIC
|
|
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
|
|
* PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL JPNIC BE LIABLE
|
|
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
|
|
* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
|
|
* WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
|
|
* OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
|
|
* ADVISED OF THE POSSIBILITY OF SUCH DAMAGES.
|
|
*/
|
|
|
|
#include <config.h>
|
|
|
|
#include <stddef.h>
|
|
|
|
#include <idn/assert.h>
|
|
#include <idn/logmacro.h>
|
|
#include <idn/result.h>
|
|
#include <idn/utf8.h>
|
|
#include <idn/debug.h>
|
|
|
|
#include "selectiveencode.h"
|
|
|
|
/*
 * File-local helpers; both are defined later in this file.
 *
 * is_domain_delimiter() yields nonzero for an ASCII byte (including NUL)
 * that is not a letter, a digit, '-' or '.'; it yields zero for every
 * byte >= 0x80.
 */
static int is_domain_delimiter(char c);
|
|
/*
 * find_nonascii() returns a pointer to the first byte >= 0x80 in 's',
 * or NULL when the terminating NUL is reached first.
 */
static char *find_nonascii(const char *s);
|
|
|
|
idn_result_t
|
|
idn_selectiveencode_findregion(const char *s,
|
|
char **startp, char **endp)
|
|
{
|
|
char *non_ascii;
|
|
char *start, *end;
|
|
|
|
assert(s != NULL && startp != NULL && endp != NULL);
|
|
|
|
TRACE(("idn_selectiveencode_findregion(s=\"%s\")\n",
|
|
idn__debug_xstring(s, 20)));
|
|
|
|
/*
|
|
* Scan the specified string looking for non-ascii character.
|
|
*/
|
|
if ((non_ascii = find_nonascii(s)) == NULL)
|
|
return (idn_notfound);
|
|
|
|
/*
|
|
* Non-ascii character found.
|
|
* Determine the region to encode.
|
|
*/
|
|
|
|
/*
|
|
* First, we scan backwards to find the beginning of the region
|
|
* that should be converted.
|
|
*/
|
|
start = non_ascii;
|
|
while (start > s) {
|
|
char *prev = idn_utf8_findfirstbyte(start - 1, s);
|
|
if (is_domain_delimiter(*prev))
|
|
break; /* Found */
|
|
start = prev;
|
|
}
|
|
*startp = start;
|
|
|
|
/*
|
|
* Next we scan forwards looking for the end of the region.
|
|
*/
|
|
end = non_ascii + idn_utf8_mblen(non_ascii);
|
|
while (!is_domain_delimiter(*end))
|
|
end += idn_utf8_mblen(end);
|
|
*endp = end;
|
|
|
|
return (idn_success);
|
|
}
|
|
|
|
/*
 * Tell whether byte 'c' separates domain-name-like tokens.
 *
 * Returns 1 for any ASCII byte (NUL included) other than a letter, a
 * digit, '-' or '.'; returns 0 for those characters and for every byte
 * with the high bit set.
 */
static int
is_domain_delimiter(char c) {
	/* Work on the unsigned value so bytes >= 0x80 are never negative. */
	unsigned char uc = (unsigned char)c;

	if (uc >= 0x80)
		return (0);
	if ((uc >= 'A' && uc <= 'Z') || (uc >= 'a' && uc <= 'z'))
		return (0);
	if (uc >= '0' && uc <= '9')
		return (0);
	if (uc == '-' || uc == '.')
		return (0);

	return (1);
}
|
|
|
|
/*
 * Return a pointer to the first byte of 's' whose value is >= 0x80, or
 * NULL if the terminating NUL is reached without meeting one.
 *
 * The returned pointer aliases 's' with its const qualifier dropped.
 */
static char *
find_nonascii(const char *s) {
	const unsigned char *p;

	for (p = (const unsigned char *)s; *p != '\0'; p++) {
		if (*p >= 0x80)
			return ((char *)p);
	}

	return (NULL);
}
|