142 lines
4.8 KiB
C
142 lines
4.8 KiB
C
#ifndef lint
|
|
static char *rcsid = "$Id: selectiveencode.c,v 1.8 2001/05/31 05:21:38 ishisone Exp $";
|
|
#endif
|
|
|
|
/*
|
|
* Copyright (c) 2000 Japan Network Information Center. All rights reserved.
|
|
*
|
|
* By using this file, you agree to the terms and conditions set forth bellow.
|
|
*
|
|
* LICENSE TERMS AND CONDITIONS
|
|
*
|
|
* The following License Terms and Conditions apply, unless a different
|
|
* license is obtained from Japan Network Information Center ("JPNIC"),
|
|
* a Japanese association, Fuundo Bldg., 1-2 Kanda Ogawamachi, Chiyoda-ku,
|
|
* Tokyo, Japan.
|
|
*
|
|
* 1. Use, Modification and Redistribution (including distribution of any
|
|
* modified or derived work) in source and/or binary forms is permitted
|
|
* under this License Terms and Conditions.
|
|
*
|
|
* 2. Redistribution of source code must retain the copyright notices as they
|
|
* appear in each source code file, this License Terms and Conditions.
|
|
*
|
|
* 3. Redistribution in binary form must reproduce the Copyright Notice,
|
|
* this License Terms and Conditions, in the documentation and/or other
|
|
* materials provided with the distribution. For the purposes of binary
|
|
* distribution the "Copyright Notice" refers to the following language:
|
|
* "Copyright (c) Japan Network Information Center. All rights reserved."
|
|
*
|
|
* 4. Neither the name of JPNIC may be used to endorse or promote products
|
|
* derived from this Software without specific prior written approval of
|
|
* JPNIC.
|
|
*
|
|
* 5. Disclaimer/Limitation of Liability: THIS SOFTWARE IS PROVIDED BY JPNIC
|
|
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
|
|
* PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL JPNIC BE LIABLE
|
|
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
|
|
* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
|
|
* WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
|
|
* OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
|
|
* ADVISED OF THE POSSIBILITY OF SUCH DAMAGES.
|
|
*
|
|
* 6. Indemnification by Licensee
|
|
* Any person or entities using and/or redistributing this Software under
|
|
* this License Terms and Conditions shall defend indemnify and hold
|
|
* harmless JPNIC from and against any and all judgements damages,
|
|
* expenses, settlement liabilities, cost and other liabilities of any
|
|
* kind as a result of use and redistribution of this Software or any
|
|
* claim, suite, action, litigation or proceeding by any third party
|
|
* arising out of or relates to this License Terms and Conditions.
|
|
*
|
|
* 7. Governing Law, Jurisdiction and Venue
|
|
* This License Terms and Conditions shall be governed by and and
|
|
* construed in accordance with the law of Japan. Any person or entities
|
|
* using and/or redistributing this Software under this License Terms and
|
|
* Conditions hereby agrees and consent to the personal and exclusive
|
|
* jurisdiction and venue of Tokyo District Court of Japan.
|
|
*/
|
|
|
|
#include <config.h>
|
|
|
|
#include <stddef.h>
|
|
|
|
#include <mdn/assert.h>
|
|
#include <mdn/logmacro.h>
|
|
#include <mdn/result.h>
|
|
#include <mdn/utf8.h>
|
|
#include <mdn/selectiveencode.h>
|
|
#include <mdn/debug.h>
|
|
|
|
static int is_domain_delimiter(char c);
|
|
static char *find_nonascii(const char *s);
|
|
|
|
mdn_result_t
|
|
mdn_selectiveencode_findregion(const char *s,
|
|
char **startp, char **endp)
|
|
{
|
|
char *non_ascii;
|
|
char *start, *end;
|
|
|
|
assert(s != NULL && startp != NULL && endp != NULL);
|
|
|
|
TRACE(("mdn_selectiveencode_findregion(s=\"%s\")\n",
|
|
mdn_debug_xstring(s, 20)));
|
|
|
|
/*
|
|
* Scan the specified string looking for non-ascii character.
|
|
*/
|
|
if ((non_ascii = find_nonascii(s)) == NULL)
|
|
return (mdn_notfound);
|
|
|
|
/*
|
|
* Non-ascii character found.
|
|
* Determine the region to encode.
|
|
*/
|
|
|
|
/*
|
|
* First, we scan backwards to find the beginning of the region
|
|
* that should be converted.
|
|
*/
|
|
start = non_ascii;
|
|
while (start > s) {
|
|
char *prev = mdn_utf8_findfirstbyte(start - 1, s);
|
|
if (is_domain_delimiter(*prev))
|
|
break; /* Found */
|
|
start = prev;
|
|
}
|
|
*startp = start;
|
|
|
|
/*
|
|
* Next we scan forwards looking for the end of the region.
|
|
*/
|
|
end = non_ascii + mdn_utf8_mblen(non_ascii);
|
|
while (!is_domain_delimiter(*end))
|
|
end += mdn_utf8_mblen(end);
|
|
*endp = end;
|
|
|
|
return (mdn_success);
|
|
}
|
|
|
|
/*
 * Return 1 if 'c' separates domain-name regions, 0 otherwise.
 *
 * A delimiter is any ASCII character (including NUL) other than a
 * letter, a digit, '-' or '.'.  Bytes >= 0x80 are never delimiters.
 */
static int
is_domain_delimiter(char c) {
	unsigned char uc = (unsigned char)c;

	/* Non-ASCII bytes belong to the name. */
	if (uc >= 0x80)
		return (0);

	/* Alphanumerics belong to the name. */
	if (('A' <= uc && uc <= 'Z') ||
	    ('a' <= uc && uc <= 'z') ||
	    ('0' <= uc && uc <= '9'))
		return (0);

	/* So do hyphen and dot. */
	if (uc == '-' || uc == '.')
		return (0);

	return (1);
}
|
|
|
|
/*
 * Return a pointer to the first byte of 's' whose value is >= 0x80,
 * or NULL if the NUL terminator is reached first.
 */
static char *
find_nonascii(const char *s) {
	const unsigned char *p;

	for (p = (const unsigned char *)s; *p != '\0'; p++) {
		if (*p >= 0x80)
			return ((char *)p);
	}
	return (NULL);
}
|