1998-11-05 19:48:35 +03:00
/*
Unix SMB / Netbios implementation .
Version 1.9 .
Samba utility functions
Copyright ( C ) Andrew Tridgell 1992 - 1998
This program is free software ; you can redistribute it and / or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation ; either version 2 of the License , or
( at your option ) any later version .
This program is distributed in the hope that it will be useful ,
but WITHOUT ANY WARRANTY ; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE . See the
GNU General Public License for more details .
You should have received a copy of the GNU General Public License
along with this program ; if not , write to the Free Software
Foundation , Inc . , 675 Mass Ave , Cambridge , MA 0213 9 , USA .
*/
# include "includes.h"
1999-12-13 16:27:58 +03:00
extern int DEBUGLEVEL ;
1999-02-11 01:30:47 +03:00
1999-12-29 05:00:38 +03:00
smb_ucs2_t wchar_list_sep [ ] = { ( smb_ucs2_t ) ' ' , ( smb_ucs2_t ) ' \t ' , ( smb_ucs2_t ) ' , ' ,
( smb_ucs2_t ) ' ; ' , ( smb_ucs2_t ) ' : ' , ( smb_ucs2_t ) ' \n ' ,
( smb_ucs2_t ) ' \r ' , 0 } ;
1999-12-13 16:27:58 +03:00
/*
* The following are the codepage to ucs2 and vica versa maps .
* These are dynamically loaded from a unicode translation file .
*/
1999-02-15 08:31:52 +03:00
1999-12-13 16:27:58 +03:00
static smb_ucs2_t * doscp_to_ucs2 ;
static uint16 * ucs2_to_doscp ;
1998-11-05 19:48:35 +03:00
1999-12-13 16:27:58 +03:00
static smb_ucs2_t * unixcp_to_ucs2 ;
static uint16 * ucs2_to_unixcp ;
1998-11-05 19:48:35 +03:00
1999-12-13 16:27:58 +03:00
# ifndef MAXUNI
# define MAXUNI 1024
# endif
1999-02-11 01:30:47 +03:00
1998-11-05 19:48:35 +03:00
/*******************************************************************
1999-12-13 16:27:58 +03:00
Write a string in ( little - endian ) unicode format . src is in
the current DOS codepage . len is the length in bytes of the
string pointed to by dst .
1999-10-25 23:03:27 +04:00
2000-03-27 16:38:45 +04:00
if null_terminate is True then null terminate the packet ( adds 2 bytes )
2000-06-22 05:39:17 +04:00
the return value is the length in bytes consumed by the string , including the
2000-03-27 16:38:45 +04:00
null termination if applied
1999-12-13 16:27:58 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-02-15 08:31:52 +03:00
2000-06-22 05:39:17 +04:00
size_t dos_PutUniCode ( char * dst , const char * src , ssize_t len , BOOL null_terminate )
1999-12-13 16:27:58 +03:00
{
2000-06-22 05:39:17 +04:00
size_t ret = 0 ;
2000-06-23 21:31:38 +04:00
while ( * src & & ( len > = 2 ) ) {
2000-01-26 03:12:35 +03:00
size_t skip = get_character_len ( * src ) ;
1999-12-13 16:27:58 +03:00
smb_ucs2_t val = ( * src & 0xff ) ;
/*
* If this is a multibyte character ( and all DOS / Windows
* codepages have at maximum 2 byte multibyte characters )
* then work out the index value for the unicode conversion .
*/
if ( skip = = 2 )
1999-12-13 22:17:40 +03:00
val = ( ( val < < 8 ) | ( src [ 1 ] & 0xff ) ) ;
1999-12-13 16:27:58 +03:00
SSVAL ( dst , ret , doscp_to_ucs2 [ val ] ) ;
ret + = 2 ;
len - = 2 ;
if ( skip )
src + = skip ;
else
src + + ;
1998-11-05 19:48:35 +03:00
}
2000-03-27 16:38:45 +04:00
if ( null_terminate ) {
SSVAL ( dst , ret , 0 ) ;
ret + = 2 ;
}
1999-12-13 16:27:58 +03:00
return ( ret ) ;
}
1999-02-15 08:31:52 +03:00
2000-02-07 19:22:16 +03:00
/*******************************************************************
2000-05-11 02:47:09 +04:00
Pull a DOS codepage string out of a UNICODE array . len is in bytes .
2000-02-07 19:22:16 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
2000-06-01 21:01:34 +04:00
void unistr_to_dos ( char * dest , const char * src , size_t len )
2000-02-07 19:22:16 +03:00
{
char * destend = dest + len ;
2000-04-30 15:04:28 +04:00
while ( dest < destend ) {
2000-05-11 02:47:09 +04:00
uint16 ucs2_val = SVAL ( src , 0 ) ;
uint16 cp_val = ucs2_to_doscp [ ucs2_val ] ;
2000-04-30 15:04:28 +04:00
src + = 2 ;
2000-02-07 19:22:16 +03:00
2000-05-11 02:47:09 +04:00
if ( ucs2_val = = 0 )
break ;
if ( cp_val < 256 )
* dest + + = ( char ) cp_val ;
else {
* dest + + = ( cp_val > > 8 ) & 0xff ;
* dest + + = ( cp_val & 0xff ) ;
}
2000-02-07 19:22:16 +03:00
}
* dest = 0 ;
}
1999-12-13 16:27:58 +03:00
/*******************************************************************
2000-04-22 04:33:16 +04:00
Skip past a unicode string , but not more than len . Always move
past a terminating zero if found .
1999-12-13 16:27:58 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-10-08 02:10:29 +04:00
2000-04-22 04:33:16 +04:00
char * skip_unibuf ( char * src , size_t len )
1999-12-13 16:27:58 +03:00
{
2000-04-22 04:33:16 +04:00
char * srcend = src + len ;
while ( src < srcend & & SVAL ( src , 0 ) )
src + = 2 ;
if ( ! SVAL ( src , 0 ) )
src + = 2 ;
return src ;
1998-11-05 19:48:35 +03:00
}
/*******************************************************************
1999-12-13 16:27:58 +03:00
Return a DOS codepage version of a little - endian unicode string .
2000-03-22 23:39:31 +03:00
len is the filename length ( ignoring any terminating zero ) in uin16
units . Always null terminates .
1999-12-13 16:27:58 +03:00
Hack alert : uses fixed buffer ( s ) .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-02-11 01:30:47 +03:00
1999-12-13 16:27:58 +03:00
char * dos_unistrn2 ( uint16 * src , int len )
1998-11-05 19:48:35 +03:00
{
1999-12-13 16:27:58 +03:00
static char lbufs [ 8 ] [ MAXUNI ] ;
static int nexti ;
char * lbuf = lbufs [ nexti ] ;
char * p ;
nexti = ( nexti + 1 ) % 8 ;
for ( p = lbuf ; ( len > 0 ) & & ( p - lbuf < MAXUNI - 3 ) & & * src ; len - - , src + + ) {
uint16 ucs2_val = SVAL ( src , 0 ) ;
uint16 cp_val = ucs2_to_doscp [ ucs2_val ] ;
if ( cp_val < 256 )
* p + + = ( char ) cp_val ;
else {
* p + + = ( cp_val > > 8 ) & 0xff ;
* p + + = ( cp_val & 0xff ) ;
1999-02-12 03:16:09 +03:00
}
1998-11-05 19:48:35 +03:00
}
1999-02-15 08:31:52 +03:00
1999-12-13 16:27:58 +03:00
* p = 0 ;
return lbuf ;
1998-11-05 19:48:35 +03:00
}
1999-12-13 16:27:58 +03:00
static char lbufs [ 8 ] [ MAXUNI ] ;
static int nexti ;
1998-11-10 22:05:00 +03:00
/*******************************************************************
1999-12-13 16:27:58 +03:00
Return a DOS codepage version of a little - endian unicode string .
Hack alert : uses fixed buffer ( s ) .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-02-11 01:30:47 +03:00
1999-12-13 16:27:58 +03:00
char * dos_unistr2 ( uint16 * src )
1998-11-10 22:05:00 +03:00
{
1999-12-13 16:27:58 +03:00
char * lbuf = lbufs [ nexti ] ;
char * p ;
nexti = ( nexti + 1 ) % 8 ;
2000-12-18 23:03:15 +03:00
for ( p = lbuf ; ( p - lbuf < MAXUNI - 3 ) & & * src ; src + + ) {
1999-12-13 16:27:58 +03:00
uint16 ucs2_val = SVAL ( src , 0 ) ;
uint16 cp_val = ucs2_to_doscp [ ucs2_val ] ;
1999-02-15 08:31:52 +03:00
1999-12-13 16:27:58 +03:00
if ( cp_val < 256 )
* p + + = ( char ) cp_val ;
else {
* p + + = ( cp_val > > 8 ) & 0xff ;
* p + + = ( cp_val & 0xff ) ;
}
1998-11-10 22:05:00 +03:00
}
1999-02-15 08:31:52 +03:00
1999-12-13 16:27:58 +03:00
* p = 0 ;
return lbuf ;
1998-11-10 22:05:00 +03:00
}
/*******************************************************************
1999-12-13 16:27:58 +03:00
Return a DOS codepage version of a little - endian unicode string
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-02-11 01:30:47 +03:00
1999-12-13 16:27:58 +03:00
char * dos_unistr2_to_str ( UNISTR2 * str )
1998-11-10 22:05:00 +03:00
{
1999-12-13 16:27:58 +03:00
char * lbuf = lbufs [ nexti ] ;
char * p ;
uint16 * src = str - > buffer ;
2000-10-10 22:34:44 +04:00
int max_size = MIN ( MAXUNI - 3 , str - > uni_str_len ) ;
1999-12-13 16:27:58 +03:00
nexti = ( nexti + 1 ) % 8 ;
2000-12-18 23:03:15 +03:00
for ( p = lbuf ; ( p - lbuf < max_size ) & & * src ; src + + ) {
1999-12-13 16:27:58 +03:00
uint16 ucs2_val = SVAL ( src , 0 ) ;
uint16 cp_val = ucs2_to_doscp [ ucs2_val ] ;
if ( cp_val < 256 )
* p + + = ( char ) cp_val ;
else {
* p + + = ( cp_val > > 8 ) & 0xff ;
* p + + = ( cp_val & 0xff ) ;
1998-11-10 22:05:00 +03:00
}
}
1999-02-15 08:31:52 +03:00
1999-12-13 16:27:58 +03:00
* p = 0 ;
return lbuf ;
1998-11-10 22:05:00 +03:00
}
2000-07-07 10:20:46 +04:00
/*******************************************************************
Put an ASCII string into a UNICODE array ( uint16 ' s ) .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
void ascii_to_unistr ( uint16 * dest , const char * src , int maxlen )
{
uint16 * destend = dest + maxlen ;
register char c ;
while ( dest < destend )
{
c = * ( src + + ) ;
if ( c = = 0 )
{
break ;
}
* ( dest + + ) = ( uint16 ) c ;
}
* dest = 0 ;
}
/*******************************************************************
Pull an ASCII string out of a UNICODE array ( uint16 ' s ) .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
void unistr_to_ascii ( char * dest , const uint16 * src , int len )
{
char * destend = dest + len ;
register uint16 c ;
2000-08-10 18:00:05 +04:00
if ( src = = NULL )
{
* dest = ' \0 ' ;
2000-08-12 18:20:40 +04:00
return ;
2000-08-10 18:00:05 +04:00
}
2000-08-12 18:20:40 +04:00
/* normal code path for a valid 'src' */
while ( dest < destend )
2000-08-10 18:00:05 +04:00
{
2000-08-12 18:20:40 +04:00
c = * ( src + + ) ;
if ( c = = 0 )
{
break ;
}
* ( dest + + ) = ( char ) c ;
2000-08-10 18:00:05 +04:00
}
2000-08-12 18:20:40 +04:00
* dest = 0 ;
return ;
2000-07-07 10:20:46 +04:00
}
2000-02-07 19:22:16 +03:00
/*******************************************************************
Convert a UNISTR2 structure to an ASCII string
Warning : this version does DOS codepage .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
void unistr2_to_ascii ( char * dest , const UNISTR2 * str , size_t maxlen )
{
2000-12-15 12:31:56 +03:00
char * p ;
uint16 * src ;
2000-02-07 19:22:16 +03:00
size_t len ;
2000-12-15 12:31:56 +03:00
if ( str = = NULL ) {
* dest = ' \0 ' ;
return ;
}
2000-02-07 19:22:16 +03:00
src = str - > buffer ;
len = MIN ( str - > uni_str_len , maxlen ) ;
2000-12-15 12:31:56 +03:00
if ( len = = 0 ) {
* dest = ' \0 ' ;
return ;
}
2000-12-16 02:02:01 +03:00
for ( p = dest ; ( p - dest < len ) & & * src ; src + + ) {
2000-12-15 12:31:56 +03:00
uint16 ucs2_val = SVAL ( src , 0 ) ;
uint16 cp_val = ucs2_to_doscp [ ucs2_val ] ;
2000-02-07 19:22:16 +03:00
if ( cp_val < 256 )
2000-12-15 12:31:56 +03:00
* p + + = ( char ) cp_val ;
2000-02-07 19:22:16 +03:00
else {
2000-12-15 12:31:56 +03:00
* p = ( cp_val > > 8 ) & 0xff ;
* p + + = ( cp_val & 0xff ) ;
2000-02-07 19:22:16 +03:00
}
}
2000-12-15 12:31:56 +03:00
* p = 0 ;
2000-02-07 19:22:16 +03:00
}
1999-02-12 03:16:09 +03:00
/*******************************************************************
1999-12-13 16:27:58 +03:00
Return a number stored in a buffer
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-02-11 21:50:13 +03:00
1999-12-13 16:27:58 +03:00
uint32 buffer2_to_uint32 ( BUFFER2 * str )
1999-02-12 03:16:09 +03:00
{
1999-12-13 16:27:58 +03:00
if ( str - > buf_len = = 4 )
return IVAL ( str - > buffer , 0 ) ;
else
return 0 ;
}
1999-02-11 21:50:13 +03:00
1999-12-13 16:27:58 +03:00
/*******************************************************************
Return a DOS codepage version of a NOTunicode string
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
char * dos_buffer2_to_str ( BUFFER2 * str )
{
char * lbuf = lbufs [ nexti ] ;
char * p ;
uint16 * src = str - > buffer ;
int max_size = MIN ( sizeof ( str - > buffer ) - 3 , str - > buf_len / 2 ) ;
nexti = ( nexti + 1 ) % 8 ;
2000-12-16 02:02:01 +03:00
for ( p = lbuf ; ( p - lbuf < max_size ) & & * src ; src + + ) {
1999-12-13 16:27:58 +03:00
uint16 ucs2_val = SVAL ( src , 0 ) ;
uint16 cp_val = ucs2_to_doscp [ ucs2_val ] ;
if ( cp_val < 256 )
* p + + = ( char ) cp_val ;
else {
* p + + = ( cp_val > > 8 ) & 0xff ;
* p + + = ( cp_val & 0xff ) ;
}
1999-02-12 18:35:27 +03:00
}
1999-02-11 21:50:13 +03:00
1999-12-13 16:27:58 +03:00
* p = 0 ;
return lbuf ;
1999-02-11 21:50:13 +03:00
}
1998-11-05 19:48:35 +03:00
/*******************************************************************
1999-12-13 16:27:58 +03:00
Return a dos codepage version of a NOTunicode string
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-02-11 01:30:47 +03:00
1999-12-13 16:27:58 +03:00
char * dos_buffer2_to_multistr ( BUFFER2 * str )
1998-11-05 19:48:35 +03:00
{
1999-12-13 16:27:58 +03:00
char * lbuf = lbufs [ nexti ] ;
char * p ;
uint16 * src = str - > buffer ;
int max_size = MIN ( sizeof ( str - > buffer ) - 3 , str - > buf_len / 2 ) ;
nexti = ( nexti + 1 ) % 8 ;
for ( p = lbuf ; p - lbuf < max_size ; src + + ) {
if ( * src = = 0 ) {
* p + + = ' ' ;
} else {
uint16 ucs2_val = SVAL ( src , 0 ) ;
uint16 cp_val = ucs2_to_doscp [ ucs2_val ] ;
if ( cp_val < 256 )
* p + + = ( char ) cp_val ;
else {
* p + + = ( cp_val > > 8 ) & 0xff ;
* p + + = ( cp_val & 0xff ) ;
}
1998-11-05 19:48:35 +03:00
}
}
1999-12-13 16:27:58 +03:00
* p = 0 ;
return lbuf ;
1998-11-05 19:48:35 +03:00
}
/*******************************************************************
1999-12-13 16:27:58 +03:00
Create a null - terminated unicode string from a null - terminated DOS
codepage string .
Return number of unicode chars copied , excluding the null character .
Unicode strings created are in little - endian format .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-02-11 01:30:47 +03:00
1999-12-13 16:27:58 +03:00
size_t dos_struni2 ( char * dst , const char * src , size_t max_len )
1998-11-05 19:48:35 +03:00
{
1999-12-13 16:27:58 +03:00
size_t len = 0 ;
if ( dst = = NULL )
1999-02-12 03:16:09 +03:00
return 0 ;
1999-12-13 16:27:58 +03:00
if ( src ! = NULL ) {
2000-12-16 02:02:01 +03:00
for ( ; ( len < max_len - 2 ) & & * src ; len + + , dst + = 2 ) {
2000-01-26 03:12:35 +03:00
size_t skip = get_character_len ( * src ) ;
1999-12-13 16:27:58 +03:00
smb_ucs2_t val = ( * src & 0xff ) ;
/*
* If this is a multibyte character ( and all DOS / Windows
* codepages have at maximum 2 byte multibyte characters )
* then work out the index value for the unicode conversion .
*/
if ( skip = = 2 )
1999-12-13 22:17:40 +03:00
val = ( ( val < < 8 ) | ( src [ 1 ] & 0xff ) ) ;
1999-12-13 16:27:58 +03:00
SSVAL ( dst , 0 , doscp_to_ucs2 [ val ] ) ;
if ( skip )
src + = skip ;
else
src + + ;
}
1998-11-05 19:48:35 +03:00
}
1999-12-13 16:27:58 +03:00
SSVAL ( dst , 0 , 0 ) ;
return len ;
}
1998-11-05 19:48:35 +03:00
/*******************************************************************
1999-12-13 16:27:58 +03:00
Return a DOS codepage version of a little - endian unicode string .
Hack alert : uses fixed buffer ( s ) .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
char * dos_unistr ( char * buf )
1998-11-05 19:48:35 +03:00
{
1999-12-13 16:27:58 +03:00
char * lbuf = lbufs [ nexti ] ;
uint16 * src = ( uint16 * ) buf ;
char * p ;
nexti = ( nexti + 1 ) % 8 ;
2000-12-16 02:02:01 +03:00
for ( p = lbuf ; ( p - lbuf < MAXUNI - 3 ) & & * src ; src + + ) {
1999-12-13 16:27:58 +03:00
uint16 ucs2_val = SVAL ( src , 0 ) ;
uint16 cp_val = ucs2_to_doscp [ ucs2_val ] ;
if ( cp_val < 256 )
* p + + = ( char ) cp_val ;
else {
* p + + = ( cp_val > > 8 ) & 0xff ;
* p + + = ( cp_val & 0xff ) ;
}
1998-11-05 19:48:35 +03:00
}
1999-12-13 16:27:58 +03:00
* p = 0 ;
return lbuf ;
1998-11-05 19:48:35 +03:00
}
1999-10-31 02:34:38 +04:00
/*******************************************************************
1999-12-13 16:27:58 +03:00
Strcpy for unicode strings . returns length ( in num of wide chars )
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
int unistrcpy ( char * dst , char * src )
1999-10-31 02:34:38 +04:00
{
1999-12-13 16:27:58 +03:00
int num_wchars = 0 ;
uint16 * wsrc = ( uint16 * ) src ;
uint16 * wdst = ( uint16 * ) dst ;
while ( * wsrc ) {
* wdst + + = * wsrc + + ;
num_wchars + + ;
1999-10-31 02:34:38 +04:00
}
1999-12-13 16:27:58 +03:00
* wdst = 0 ;
1999-10-31 02:34:38 +04:00
1999-12-13 16:27:58 +03:00
return num_wchars ;
1999-10-31 02:34:38 +04:00
}
1999-11-03 23:01:07 +03:00
1999-12-13 16:27:58 +03:00
1999-11-03 23:01:07 +03:00
/*******************************************************************
1999-12-22 02:14:01 +03:00
Free any existing maps .
1999-11-03 23:01:07 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-22 02:14:01 +03:00
1999-12-13 16:27:58 +03:00
static void free_maps ( smb_ucs2_t * * pp_cp_to_ucs2 , uint16 * * pp_ucs2_to_cp )
1999-11-03 23:01:07 +03:00
{
1999-12-13 16:27:58 +03:00
/* this handles identity mappings where we share the pointer */
if ( * pp_ucs2_to_cp = = * pp_cp_to_ucs2 ) {
* pp_ucs2_to_cp = NULL ;
1999-11-05 00:41:36 +03:00
}
1999-12-13 16:27:58 +03:00
if ( * pp_cp_to_ucs2 ) {
free ( * pp_cp_to_ucs2 ) ;
* pp_cp_to_ucs2 = NULL ;
1999-11-05 00:41:36 +03:00
}
1999-11-03 23:01:07 +03:00
1999-12-13 16:27:58 +03:00
if ( * pp_ucs2_to_cp ) {
free ( * pp_ucs2_to_cp ) ;
* pp_ucs2_to_cp = NULL ;
}
1999-11-03 23:01:07 +03:00
}
1999-12-13 16:27:58 +03:00
1999-11-03 23:01:07 +03:00
/*******************************************************************
1999-12-13 16:27:58 +03:00
Build a default ( null ) codepage to unicode map .
1999-11-03 23:01:07 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-13 16:27:58 +03:00
void default_unicode_map ( smb_ucs2_t * * pp_cp_to_ucs2 , uint16 * * pp_ucs2_to_cp )
1999-11-03 23:01:07 +03:00
{
1999-12-13 16:27:58 +03:00
int i ;
free_maps ( pp_cp_to_ucs2 , pp_ucs2_to_cp ) ;
if ( ( * pp_ucs2_to_cp = ( uint16 * ) malloc ( 2 * 65536 ) ) = = NULL ) {
DEBUG ( 0 , ( " default_unicode_map: malloc fail for ucs2_to_cp size %u. \n " , 2 * 65536 ) ) ;
abort ( ) ;
}
* pp_cp_to_ucs2 = * pp_ucs2_to_cp ; /* Default map is an identity. */
for ( i = 0 ; i < 65536 ; i + + )
( * pp_cp_to_ucs2 ) [ i ] = i ;
1999-11-03 23:01:07 +03:00
}
/*******************************************************************
1999-12-13 16:27:58 +03:00
Load a codepage to unicode and vica - versa map .
1999-11-03 23:01:07 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-13 16:27:58 +03:00
BOOL load_unicode_map ( const char * codepage , smb_ucs2_t * * pp_cp_to_ucs2 , uint16 * * pp_ucs2_to_cp )
1999-11-03 23:01:07 +03:00
{
1999-12-13 16:27:58 +03:00
pstring unicode_map_file_name ;
FILE * fp = NULL ;
SMB_STRUCT_STAT st ;
smb_ucs2_t * cp_to_ucs2 = * pp_cp_to_ucs2 ;
uint16 * ucs2_to_cp = * pp_ucs2_to_cp ;
size_t cp_to_ucs2_size ;
size_t ucs2_to_cp_size ;
size_t i ;
size_t size ;
char buf [ UNICODE_MAP_HEADER_SIZE ] ;
DEBUG ( 5 , ( " load_unicode_map: loading unicode map for codepage %s. \n " , codepage ) ) ;
if ( * codepage = = ' \0 ' )
goto clean_and_exit ;
2000-12-01 04:14:55 +03:00
if ( strlen ( lp_codepagedir ( ) ) + 13 + strlen ( codepage ) >
sizeof ( unicode_map_file_name ) ) {
1999-12-13 16:27:58 +03:00
DEBUG ( 0 , ( " load_unicode_map: filename too long to load \n " ) ) ;
goto clean_and_exit ;
}
2000-12-01 04:14:55 +03:00
pstrcpy ( unicode_map_file_name , lp_codepagedir ( ) ) ;
1999-12-13 16:27:58 +03:00
pstrcat ( unicode_map_file_name , " / " ) ;
pstrcat ( unicode_map_file_name , " unicode_map. " ) ;
pstrcat ( unicode_map_file_name , codepage ) ;
if ( sys_stat ( unicode_map_file_name , & st ) ! = 0 ) {
DEBUG ( 0 , ( " load_unicode_map: filename %s does not exist. \n " ,
unicode_map_file_name ) ) ;
goto clean_and_exit ;
}
size = st . st_size ;
if ( ( size ! = UNICODE_MAP_HEADER_SIZE + 4 * 65536 ) & & ( size ! = UNICODE_MAP_HEADER_SIZE + ( 2 * 256 + 2 * 65536 ) ) ) {
DEBUG ( 0 , ( " load_unicode_map: file %s is an incorrect size for a \
unicode map file ( size = % d ) . \ n " , unicode_map_file_name, (int)size)) ;
goto clean_and_exit ;
}
if ( ( fp = sys_fopen ( unicode_map_file_name , " r " ) ) = = NULL ) {
DEBUG ( 0 , ( " load_unicode_map: cannot open file %s. Error was %s \n " ,
unicode_map_file_name , strerror ( errno ) ) ) ;
goto clean_and_exit ;
}
if ( fread ( buf , 1 , UNICODE_MAP_HEADER_SIZE , fp ) ! = UNICODE_MAP_HEADER_SIZE ) {
DEBUG ( 0 , ( " load_unicode_map: cannot read header from file %s. Error was %s \n " ,
unicode_map_file_name , strerror ( errno ) ) ) ;
goto clean_and_exit ;
}
/* Check the version value */
if ( SVAL ( buf , UNICODE_MAP_VERSION_OFFSET ) ! = UNICODE_MAP_FILE_VERSION_ID ) {
DEBUG ( 0 , ( " load_unicode_map: filename %s has incorrect version id. \
Needed % hu , got % hu . \ n " ,
unicode_map_file_name , ( uint16 ) UNICODE_MAP_FILE_VERSION_ID ,
SVAL ( buf , UNICODE_MAP_VERSION_OFFSET ) ) ) ;
goto clean_and_exit ;
}
/* Check the codepage value */
if ( ! strequal ( & buf [ UNICODE_MAP_CLIENT_CODEPAGE_OFFSET ] , codepage ) ) {
DEBUG ( 0 , ( " load_unicode_map: codepage %s in file %s is not the same as that \
requested ( % s ) . \ n " , &buf[UNICODE_MAP_CLIENT_CODEPAGE_OFFSET], unicode_map_file_name, codepage ));
goto clean_and_exit ;
}
ucs2_to_cp_size = 2 * 65536 ;
if ( size = = UNICODE_MAP_HEADER_SIZE + 4 * 65536 ) {
/*
* This is a multibyte code page .
*/
cp_to_ucs2_size = 2 * 65536 ;
} else {
/*
* Single byte code page .
*/
cp_to_ucs2_size = 2 * 256 ;
}
/*
* Free any old translation tables .
*/
free_maps ( pp_cp_to_ucs2 , pp_ucs2_to_cp ) ;
if ( ( cp_to_ucs2 = ( smb_ucs2_t * ) malloc ( cp_to_ucs2_size ) ) = = NULL ) {
DEBUG ( 0 , ( " load_unicode_map: malloc fail for cp_to_ucs2 size %u. \n " , cp_to_ucs2_size ) ) ;
goto clean_and_exit ;
}
if ( ( ucs2_to_cp = ( uint16 * ) malloc ( ucs2_to_cp_size ) ) = = NULL ) {
DEBUG ( 0 , ( " load_unicode_map: malloc fail for ucs2_to_cp size %u. \n " , ucs2_to_cp_size ) ) ;
goto clean_and_exit ;
}
if ( fread ( ( char * ) cp_to_ucs2 , 1 , cp_to_ucs2_size , fp ) ! = cp_to_ucs2_size ) {
DEBUG ( 0 , ( " load_unicode_map: cannot read cp_to_ucs2 from file %s. Error was %s \n " ,
unicode_map_file_name , strerror ( errno ) ) ) ;
goto clean_and_exit ;
}
if ( fread ( ( char * ) ucs2_to_cp , 1 , ucs2_to_cp_size , fp ) ! = ucs2_to_cp_size ) {
DEBUG ( 0 , ( " load_unicode_map: cannot read ucs2_to_cp from file %s. Error was %s \n " ,
unicode_map_file_name , strerror ( errno ) ) ) ;
goto clean_and_exit ;
}
/*
* Now ensure the 16 bit values are in the correct endianness .
*/
for ( i = 0 ; i < cp_to_ucs2_size / 2 ; i + + )
cp_to_ucs2 [ i ] = SVAL ( cp_to_ucs2 , i * 2 ) ;
for ( i = 0 ; i < ucs2_to_cp_size / 2 ; i + + )
ucs2_to_cp [ i ] = SVAL ( ucs2_to_cp , i * 2 ) ;
fclose ( fp ) ;
* pp_cp_to_ucs2 = cp_to_ucs2 ;
* pp_ucs2_to_cp = ucs2_to_cp ;
return True ;
clean_and_exit :
/* pseudo destructor :-) */
if ( fp ! = NULL )
fclose ( fp ) ;
free_maps ( pp_cp_to_ucs2 , pp_ucs2_to_cp ) ;
default_unicode_map ( pp_cp_to_ucs2 , pp_ucs2_to_cp ) ;
return False ;
}
/*******************************************************************
Load a dos codepage to unicode and vica - versa map .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
BOOL load_dos_unicode_map ( int codepage )
{
fstring codepage_str ;
slprintf ( codepage_str , sizeof ( fstring ) - 1 , " %03d " , codepage ) ;
return load_unicode_map ( codepage_str , & doscp_to_ucs2 , & ucs2_to_doscp ) ;
}
/*******************************************************************
Load a UNIX codepage to unicode and vica - versa map .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
BOOL load_unix_unicode_map ( const char * unix_char_set )
{
fstring upper_unix_char_set ;
fstrcpy ( upper_unix_char_set , unix_char_set ) ;
strupper ( upper_unix_char_set ) ;
return load_unicode_map ( upper_unix_char_set , & unixcp_to_ucs2 , & ucs2_to_unixcp ) ;
1999-11-03 23:01:07 +03:00
}
1999-12-22 02:14:01 +03:00
/*******************************************************************
The following functions reproduce many of the non - UNICODE standard
string functions in Samba .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
/*******************************************************************
Convert a UNICODE string to multibyte format . Note that the ' src ' is in
native byte order , not little endian . Always zero terminates .
dst_len is in bytes .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
static char * unicode_to_multibyte ( char * dst , const smb_ucs2_t * src ,
size_t dst_len , const uint16 * ucs2_to_cp )
{
1999-12-23 21:58:44 +03:00
size_t dst_pos ;
1999-12-22 02:14:01 +03:00
2000-12-16 02:02:01 +03:00
for ( dst_pos = 0 ; ( dst_pos < dst_len - 1 ) & & * src ; ) {
1999-12-23 21:58:44 +03:00
smb_ucs2_t val = ucs2_to_cp [ * src + + ] ;
1999-12-22 02:14:01 +03:00
if ( val < 256 ) {
1999-12-23 21:58:44 +03:00
dst [ dst_pos + + ] = ( char ) val ;
} else {
if ( dst_pos > = dst_len - 2 )
break ;
1999-12-22 02:14:01 +03:00
/*
* A 2 byte value is always written as
* high / low into the buffer stream .
*/
1999-12-23 21:58:44 +03:00
dst [ dst_pos + + ] = ( char ) ( ( val > > 8 ) & 0xff ) ;
dst [ dst_pos + + ] = ( char ) ( val & 0xff ) ;
1999-12-22 02:14:01 +03:00
}
}
1999-12-23 21:58:44 +03:00
dst [ dst_pos ] = ' \0 ' ;
1999-12-22 02:14:01 +03:00
return dst ;
}
/*******************************************************************
Convert a multibyte string to UNICODE format . Note that the ' dst ' is in
native byte order , not little endian . Always zero terminates .
dst_len is in bytes .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
smb_ucs2_t * multibyte_to_unicode ( smb_ucs2_t * dst , const char * src ,
size_t dst_len , smb_ucs2_t * cp_to_ucs2 )
{
size_t i ;
dst_len / = sizeof ( smb_ucs2_t ) ; /* Convert to smb_ucs2_t units. */
for ( i = 0 ; ( i < ( dst_len - 1 ) ) & & src [ i ] ; ) {
2000-03-22 22:03:12 +03:00
size_t skip = skip_multibyte_char ( * src ) ;
1999-12-22 02:14:01 +03:00
smb_ucs2_t val = ( * src & 0xff ) ;
/*
* If this is a multibyte character
* then work out the index value for the unicode conversion .
*/
if ( skip = = 2 )
val = ( ( val < < 8 ) | ( src [ 1 ] & 0xff ) ) ;
dst [ i + + ] = cp_to_ucs2 [ val ] ;
if ( skip )
src + = skip ;
else
src + + ;
}
dst [ i ] = 0 ;
return dst ;
}
/*******************************************************************
Convert a UNICODE string to multibyte format . Note that the ' src ' is in
native byte order , not little endian . Always zero terminates .
This function may be replaced if the MB codepage format is an
encoded one ( ie . utf8 , hex ) . See the code in lib / kanji . c
for details . dst_len is in bytes .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
char * unicode_to_unix ( char * dst , const smb_ucs2_t * src , size_t dst_len )
{
return unicode_to_multibyte ( dst , src , dst_len , ucs2_to_unixcp ) ;
}
/*******************************************************************
Convert a UNIX string to UNICODE format . Note that the ' dst ' is in
native byte order , not little endian . Always zero terminates .
This function may be replaced if the UNIX codepage format is a
multi - byte one ( ie . JIS , SJIS or utf8 ) . See the code in lib / kanji . c
for details . dst_len is in bytes , not ucs2 units .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
smb_ucs2_t * unix_to_unicode ( smb_ucs2_t * dst , const char * src , size_t dst_len )
{
return multibyte_to_unicode ( dst , src , dst_len , unixcp_to_ucs2 ) ;
}
/*******************************************************************
Convert a UNICODE string to DOS format . Note that the ' src ' is in
native byte order , not little endian . Always zero terminates .
dst_len is in bytes .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
char * unicode_to_dos ( char * dst , const smb_ucs2_t * src , size_t dst_len )
{
return unicode_to_multibyte ( dst , src , dst_len , ucs2_to_doscp ) ;
}
2000-05-12 18:28:48 +04:00
/*******************************************************************
Convert a single UNICODE character to DOS codepage . Returns the
number of bytes in the DOS codepage character .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
size_t unicode_to_dos_char ( char * dst , const smb_ucs2_t src )
{
smb_ucs2_t val = ucs2_to_doscp [ src ] ;
if ( val < 256 ) {
* dst = ( char ) val ;
return ( size_t ) 1 ;
}
/*
* A 2 byte value is always written as
* high / low into the buffer stream .
*/
dst [ 0 ] = ( char ) ( ( val > > 8 ) & 0xff ) ;
dst [ 1 ] = ( char ) ( val & 0xff ) ;
return ( size_t ) 2 ;
}
1999-12-22 02:14:01 +03:00
/*******************************************************************
Convert a DOS string to UNICODE format . Note that the ' dst ' is in
native byte order , not little endian . Always zero terminates .
This function may be replaced if the DOS codepage format is a
multi - byte one ( ie . JIS , SJIS or utf8 ) . See the code in lib / kanji . c
for details . dst_len is in bytes , not ucs2 units .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
smb_ucs2_t * dos_to_unicode ( smb_ucs2_t * dst , const char * src , size_t dst_len )
{
return multibyte_to_unicode ( dst , src , dst_len , doscp_to_ucs2 ) ;
}
/*******************************************************************
Count the number of characters in a smb_ucs2_t string .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
size_t strlen_w ( const smb_ucs2_t * src )
1999-12-22 02:14:01 +03:00
{
size_t len ;
2001-02-20 11:09:06 +03:00
for ( len = 0 ; * src + + ; len + + )
1999-12-22 02:14:01 +03:00
;
return len ;
}
/*******************************************************************
Safe wstring copy into a known length string . maxlength includes
2000-03-22 22:03:12 +03:00
the terminating zero . maxlength is in ucs2 units .
1999-12-22 02:14:01 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
smb_ucs2_t * safe_strcpy_w ( smb_ucs2_t * dest , const smb_ucs2_t * src , size_t maxlength )
1999-12-22 02:14:01 +03:00
{
size_t ucs2_len ;
if ( ! dest ) {
1999-12-29 05:00:38 +03:00
DEBUG ( 0 , ( " ERROR: NULL dest in safe_strcpy_w \n " ) ) ;
1999-12-22 02:14:01 +03:00
return NULL ;
}
if ( ! src ) {
* dest = 0 ;
return dest ;
}
1999-12-29 05:00:38 +03:00
maxlength / = sizeof ( smb_ucs2_t ) ;
ucs2_len = strlen_w ( src ) ;
if ( ucs2_len > = maxlength ) {
1999-12-22 02:14:01 +03:00
fstring out ;
1999-12-29 05:00:38 +03:00
DEBUG ( 0 , ( " ERROR: string overflow by %u bytes in safe_strcpy_w [%.50s] \n " ,
( unsigned int ) ( ( ucs2_len - maxlength ) * sizeof ( smb_ucs2_t ) ) ,
1999-12-22 02:14:01 +03:00
unicode_to_unix ( out , src , sizeof ( out ) ) ) ) ;
1999-12-29 05:00:38 +03:00
ucs2_len = maxlength - 1 ;
1999-12-22 02:14:01 +03:00
}
memcpy ( dest , src , ucs2_len * sizeof ( smb_ucs2_t ) ) ;
dest [ ucs2_len ] = 0 ;
return dest ;
}
/*******************************************************************
Safe string cat into a string . maxlength includes the terminating zero .
2000-03-22 22:03:12 +03:00
maxlength is in ucs2 units .
1999-12-22 02:14:01 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
smb_ucs2_t * safe_strcat_w ( smb_ucs2_t * dest , const smb_ucs2_t * src , size_t maxlength )
1999-12-22 02:14:01 +03:00
{
size_t ucs2_src_len , ucs2_dest_len ;
if ( ! dest ) {
1999-12-29 05:00:38 +03:00
DEBUG ( 0 , ( " ERROR: NULL dest in safe_strcat_w \n " ) ) ;
1999-12-22 02:14:01 +03:00
return NULL ;
}
1999-12-29 05:00:38 +03:00
if ( ! src )
1999-12-22 02:14:01 +03:00
return dest ;
1999-12-29 05:00:38 +03:00
ucs2_src_len = strlen_w ( src ) ;
ucs2_dest_len = strlen_w ( dest ) ;
if ( ucs2_src_len + ucs2_dest_len > = maxlength ) {
1999-12-22 02:14:01 +03:00
fstring out ;
1999-12-29 05:00:38 +03:00
int new_len = maxlength - ucs2_dest_len - 1 ;
DEBUG ( 0 , ( " ERROR: string overflow by %u characters in safe_strcat_w [%.50s] \n " ,
( unsigned int ) ( sizeof ( smb_ucs2_t ) * ( ucs2_src_len + ucs2_dest_len - maxlength ) ) ,
1999-12-22 02:14:01 +03:00
unicode_to_unix ( out , src , sizeof ( out ) ) ) ) ;
ucs2_src_len = ( size_t ) ( new_len > 0 ? new_len : 0 ) ;
}
memcpy ( & dest [ ucs2_dest_len ] , src , ucs2_src_len * sizeof ( smb_ucs2_t ) ) ;
dest [ ucs2_dest_len + ucs2_src_len ] = 0 ;
return dest ;
}
1999-12-22 03:17:35 +03:00
/*******************************************************************
2000-03-22 22:03:12 +03:00
Compare the two strings s1 and s2 .
1999-12-22 03:17:35 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
int strcmp_w ( const smb_ucs2_t * s1 , const smb_ucs2_t * s2 )
1999-12-22 03:17:35 +03:00
{
smb_ucs2_t c1 , c2 ;
for ( ; ; ) {
c1 = * s1 + + ;
c2 = * s2 + + ;
if ( c1 ! = c2 )
return c1 - c2 ;
if ( c1 = = 0 )
2000-10-04 05:03:23 +04:00
break ;
}
1999-12-22 03:17:35 +03:00
return 0 ;
}
/*******************************************************************
Compare the first n characters of s1 to s2 . len is in ucs2 units .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
int strncmp_w ( const smb_ucs2_t * s1 , const smb_ucs2_t * s2 , size_t len )
1999-12-22 03:17:35 +03:00
{
smb_ucs2_t c1 , c2 ;
for ( ; len ! = 0 ; - - len ) {
c1 = * s1 + + ;
c2 = * s2 + + ;
if ( c1 ! = c2 )
return c1 - c2 ;
if ( c1 = = 0 )
2000-10-04 05:03:23 +04:00
break ;
1999-12-22 03:17:35 +03:00
2000-10-04 05:03:23 +04:00
}
1999-12-22 03:17:35 +03:00
return 0 ;
}
/*******************************************************************
Search string s2 from s1 .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
smb_ucs2_t * strstr_w ( const smb_ucs2_t * s1 , const smb_ucs2_t * s2 )
1999-12-22 03:17:35 +03:00
{
1999-12-29 05:00:38 +03:00
size_t len = strlen_w ( s2 ) ;
1999-12-22 03:17:35 +03:00
if ( ! * s2 )
return ( smb_ucs2_t * ) s1 ;
for ( ; * s1 ; s1 + + ) {
if ( * s1 = = * s2 ) {
1999-12-29 05:00:38 +03:00
if ( strncmp_w ( s1 , s2 , len ) = = 0 )
1999-12-22 03:17:35 +03:00
return ( smb_ucs2_t * ) s1 ;
}
}
return NULL ;
}
/*******************************************************************
Search for ucs2 char c from the beginning of s .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
smb_ucs2_t * strchr_w ( const smb_ucs2_t * s , smb_ucs2_t c )
1999-12-22 03:17:35 +03:00
{
do {
if ( * s = = c )
return ( smb_ucs2_t * ) s ;
} while ( * s + + ) ;
return NULL ;
}
/*******************************************************************
Search for ucs2 char c from the end of s .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
smb_ucs2_t * strrchr_w ( const smb_ucs2_t * s , smb_ucs2_t c )
1999-12-22 03:17:35 +03:00
{
smb_ucs2_t * retval = 0 ;
do {
if ( * s = = c )
retval = ( smb_ucs2_t * ) s ;
} while ( * s + + ) ;
return retval ;
}
/*******************************************************************
Search token from s1 separated by any ucs2 char of s2 .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
smb_ucs2_t * strtok_w ( smb_ucs2_t * s1 , const smb_ucs2_t * s2 )
1999-12-22 03:17:35 +03:00
{
static smb_ucs2_t * s = NULL ;
smb_ucs2_t * q ;
if ( ! s1 ) {
if ( ! s )
return NULL ;
s1 = s ;
}
for ( q = s1 ; * s1 ; s1 + + ) {
1999-12-29 05:00:38 +03:00
smb_ucs2_t * p = strchr_w ( s2 , * s1 ) ;
1999-12-22 03:17:35 +03:00
if ( p ) {
if ( s1 ! = q ) {
s = s1 + 1 ;
* s1 = ' \0 ' ;
return q ;
}
q = s1 + 1 ;
}
}
s = NULL ;
if ( * q )
return q ;
return NULL ;
}
1999-12-22 21:46:05 +03:00
/*******************************************************************
Duplicate a ucs2 string .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
smb_ucs2_t * strdup_w ( const smb_ucs2_t * s )
1999-12-22 21:46:05 +03:00
{
1999-12-29 05:00:38 +03:00
size_t newlen = ( strlen_w ( s ) + 1 ) * sizeof ( smb_ucs2_t ) ;
1999-12-22 21:46:05 +03:00
smb_ucs2_t * newstr = ( smb_ucs2_t * ) malloc ( newlen ) ;
if ( newstr = = NULL )
return NULL ;
1999-12-29 05:00:38 +03:00
safe_strcpy_w ( newstr , s , newlen ) ;
1999-12-22 21:46:05 +03:00
return newstr ;
}
1999-12-23 04:57:43 +03:00
/*******************************************************************
Mapping tables for UNICODE character . Allows toupper / tolower and
isXXX functions to work .
2000-04-15 11:14:40 +04:00
tridge : split into 2 pieces . This saves us 5 / 6 of the memory
with a small speed penalty
The magic constants are the lower / upper range of the tables two
parts
1999-12-23 04:57:43 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
typedef struct {
smb_ucs2_t lower ;
smb_ucs2_t upper ;
unsigned char flags ;
} smb_unicode_table_t ;
2000-04-15 12:07:11 +04:00
# define TABLE1_BOUNDARY 9450
# define TABLE2_BOUNDARY 64256
2000-04-15 11:14:40 +04:00
static smb_unicode_table_t map_table1 [ ] = {
# include "unicode_map_table1.h"
} ;
static smb_unicode_table_t map_table2 [ ] = {
# include "unicode_map_table2.h"
1999-12-23 04:57:43 +03:00
} ;
2000-04-15 11:14:40 +04:00
static unsigned char map_table_flags ( smb_ucs2_t v )
{
2000-04-15 12:07:11 +04:00
if ( v < TABLE1_BOUNDARY ) return map_table1 [ v ] . flags ;
if ( v > = TABLE2_BOUNDARY ) return map_table2 [ v - TABLE2_BOUNDARY ] . flags ;
2000-04-15 11:14:40 +04:00
return 0 ;
}
static smb_ucs2_t map_table_lower ( smb_ucs2_t v )
{
2000-04-15 12:07:11 +04:00
if ( v < TABLE1_BOUNDARY ) return map_table1 [ v ] . lower ;
if ( v > = TABLE2_BOUNDARY ) return map_table2 [ v - TABLE2_BOUNDARY ] . lower ;
2000-04-15 11:14:40 +04:00
return v ;
}
static smb_ucs2_t map_table_upper ( smb_ucs2_t v )
{
2000-04-15 12:07:11 +04:00
if ( v < TABLE1_BOUNDARY ) return map_table1 [ v ] . upper ;
if ( v > = TABLE2_BOUNDARY ) return map_table2 [ v - TABLE2_BOUNDARY ] . upper ;
2000-04-15 11:14:40 +04:00
return v ;
}
1999-12-23 04:57:43 +03:00
/*******************************************************************
Is an upper case wchar .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
int isupper_w ( smb_ucs2_t val )
1999-12-23 04:57:43 +03:00
{
2000-04-15 11:14:40 +04:00
return ( map_table_flags ( val ) & UNI_UPPER ) ;
1999-12-23 04:57:43 +03:00
}
1999-12-23 21:58:44 +03:00
1999-12-23 04:57:43 +03:00
/*******************************************************************
Is a lower case wchar .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
int islower_w ( smb_ucs2_t val )
1999-12-23 04:57:43 +03:00
{
2000-04-15 11:14:40 +04:00
return ( map_table_flags ( val ) & UNI_LOWER ) ;
1999-12-23 04:57:43 +03:00
}
1999-12-23 21:58:44 +03:00
1999-12-23 04:57:43 +03:00
/*******************************************************************
Is a digit wchar .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
int isdigit_w ( smb_ucs2_t val )
1999-12-23 04:57:43 +03:00
{
2000-04-15 11:14:40 +04:00
return ( map_table_flags ( val ) & UNI_DIGIT ) ;
1999-12-23 04:57:43 +03:00
}
1999-12-23 21:58:44 +03:00
1999-12-23 04:57:43 +03:00
/*******************************************************************
Is a hex digit wchar .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
int isxdigit_w ( smb_ucs2_t val )
1999-12-23 04:57:43 +03:00
{
2000-04-15 11:14:40 +04:00
return ( map_table_flags ( val ) & UNI_XDIGIT ) ;
1999-12-23 04:57:43 +03:00
}
1999-12-23 05:01:37 +03:00
1999-12-23 04:57:43 +03:00
/*******************************************************************
Is a space wchar .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
int isspace_w ( smb_ucs2_t val )
1999-12-23 04:57:43 +03:00
{
2000-04-15 11:14:40 +04:00
return ( map_table_flags ( val ) & UNI_SPACE ) ;
1999-12-23 04:57:43 +03:00
}
1999-12-23 05:01:37 +03:00
/*******************************************************************
Convert a wchar to upper case .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
smb_ucs2_t toupper_w ( smb_ucs2_t val )
1999-12-23 05:01:37 +03:00
{
2000-04-15 11:14:40 +04:00
return map_table_upper ( val ) ;
1999-12-23 05:01:37 +03:00
}
/*******************************************************************
Convert a wchar to lower case .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
1999-12-29 05:00:38 +03:00
smb_ucs2_t tolower_w ( smb_ucs2_t val )
1999-12-23 05:01:37 +03:00
{
2000-04-15 11:14:40 +04:00
return map_table_lower ( val ) ;
1999-12-23 05:01:37 +03:00
}
1999-12-29 05:00:38 +03:00
static smb_ucs2_t * last_ptr = NULL ;
void set_first_token_w ( smb_ucs2_t * ptr )
{
last_ptr = ptr ;
}
/****************************************************************************
Get the next token from a string , return False if none found
handles double - quotes .
Based on a routine by GJC @ VILLAGE . COM .
Extensively modified by Andrew . Tridgell @ anu . edu . au
bufsize is in bytes .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
static smb_ucs2_t sep_list [ ] = { ( smb_ucs2_t ) ' ' , ( smb_ucs2_t ) ' \t ' , ( smb_ucs2_t ) ' \n ' , ( smb_ucs2_t ) ' \r ' , 0 } ;
static smb_ucs2_t quotechar = ( smb_ucs2_t ) ' \" ' ;
BOOL next_token_w ( smb_ucs2_t * * ptr , smb_ucs2_t * buff , smb_ucs2_t * sep , size_t bufsize )
{
smb_ucs2_t * s ;
BOOL quoted ;
size_t len = 1 ;
/*
* Convert bufsize to smb_ucs2_t units .
*/
bufsize / = sizeof ( smb_ucs2_t ) ;
if ( ! ptr )
ptr = & last_ptr ;
if ( ! ptr )
return ( False ) ;
s = * ptr ;
/*
* Default to simple separators .
*/
if ( ! sep )
sep = sep_list ;
/*
* Find the first non sep char .
*/
while ( * s & & strchr_w ( sep , * s ) )
s + + ;
/*
* Nothing left ?
*/
if ( ! * s )
return ( False ) ;
/*
* Copy over the token .
*/
for ( quoted = False ; len < bufsize & & * s & & ( quoted | | ! strchr_w ( sep , * s ) ) ; s + + ) {
if ( * s = = quotechar ) {
quoted = ! quoted ;
} else {
len + + ;
* buff + + = * s ;
}
}
* ptr = ( * s ) ? s + 1 : s ;
* buff = 0 ;
last_ptr = * ptr ;
return ( True ) ;
}
/****************************************************************************
Convert list of tokens to array ; dependent on above routine .
Uses last_ptr from above - bit of a hack .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
smb_ucs2_t * * toktocliplist_w ( int * ctok , smb_ucs2_t * sep )
{
smb_ucs2_t * s = last_ptr ;
int ictok = 0 ;
smb_ucs2_t * * ret , * * iret ;
if ( ! sep )
sep = sep_list ;
while ( * s & & strchr_w ( sep , * s ) )
s + + ;
/*
* Nothing left ?
*/
if ( ! * s )
return ( NULL ) ;
do {
ictok + + ;
while ( * s & & ( ! strchr_w ( sep , * s ) ) )
s + + ;
while ( * s & & strchr_w ( sep , * s ) )
* s + + = 0 ;
} while ( * s ) ;
* ctok = ictok ;
s = last_ptr ;
if ( ! ( ret = iret = malloc ( ictok * sizeof ( smb_ucs2_t * ) ) ) )
return NULL ;
while ( ictok - - ) {
* iret + + = s ;
while ( * s + + )
;
while ( ! * s )
s + + ;
}
return ret ;
}
/*******************************************************************
Case insensitive string compararison .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
int StrCaseCmp_w ( const smb_ucs2_t * s , const smb_ucs2_t * t )
{
/*
* Compare until we run out of string , either t or s , or find a difference .
*/
while ( * s & & * t & & toupper_w ( * s ) = = toupper_w ( * t ) ) {
s + + ;
t + + ;
}
return ( toupper_w ( * s ) - toupper_w ( * t ) ) ;
}
/*******************************************************************
Case insensitive string compararison , length limited .
2000-03-22 22:03:12 +03:00
n is in ucs2 units .
1999-12-29 05:00:38 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
int StrnCaseCmp_w ( const smb_ucs2_t * s , const smb_ucs2_t * t , size_t n )
{
/*
* Compare until we run out of string , either t or s , or chars .
*/
while ( n & & * s & & * t & & toupper_w ( * s ) = = toupper_w ( * t ) ) {
s + + ;
t + + ;
n - - ;
}
/*
* Not run out of chars - strings are different lengths .
*/
if ( n )
return ( toupper_w ( * s ) - toupper_w ( * t ) ) ;
/*
* Identical up to where we run out of chars ,
* and strings are same length .
*/
return ( 0 ) ;
}
/*******************************************************************
Compare 2 strings .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
BOOL strequal_w ( const smb_ucs2_t * s1 , const smb_ucs2_t * s2 )
{
if ( s1 = = s2 )
return ( True ) ;
if ( ! s1 | | ! s2 )
return ( False ) ;
return ( StrCaseCmp_w ( s1 , s2 ) = = 0 ) ;
}
/*******************************************************************
2000-03-22 22:03:12 +03:00
Compare 2 strings up to and including the nth char . n is in ucs2
units .
1999-12-29 05:00:38 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
BOOL strnequal_w ( const smb_ucs2_t * s1 , const smb_ucs2_t * s2 , size_t n )
{
if ( s1 = = s2 )
return ( True ) ;
if ( ! s1 | | ! s2 | | ! n )
return ( False ) ;
return ( StrnCaseCmp_w ( s1 , s2 , n ) = = 0 ) ;
}
/*******************************************************************
Compare 2 strings ( case sensitive ) .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
BOOL strcsequal_w ( const smb_ucs2_t * s1 , const smb_ucs2_t * s2 )
{
if ( s1 = = s2 )
return ( True ) ;
if ( ! s1 | | ! s2 )
return ( False ) ;
return ( strcmp_w ( s1 , s2 ) = = 0 ) ;
}
/*******************************************************************
Convert a string to lower case .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
void strlower_w ( smb_ucs2_t * s )
{
while ( * s ) {
if ( isupper_w ( * s ) )
* s = tolower_w ( * s ) ;
s + + ;
}
}
/*******************************************************************
Convert a string to upper case .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
void strupper_w ( smb_ucs2_t * s )
{
while ( * s ) {
if ( islower_w ( * s ) )
* s = toupper_w ( * s ) ;
s + + ;
}
}
/*******************************************************************
Convert a string to " normal " form .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
void strnorm_w ( smb_ucs2_t * s )
{
extern int case_default ;
if ( case_default = = CASE_UPPER )
strupper_w ( s ) ;
else
strlower_w ( s ) ;
}
/*******************************************************************
Check if a string is in " normal " case .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
BOOL strisnormal_w ( smb_ucs2_t * s )
{
extern int case_default ;
if ( case_default = = CASE_UPPER )
return ( ! strhaslower_w ( s ) ) ;
return ( ! strhasupper_w ( s ) ) ;
}
/****************************************************************************
String replace .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
void string_replace_w ( smb_ucs2_t * s , smb_ucs2_t oldc , smb_ucs2_t newc )
{
while ( * s ) {
if ( oldc = = * s )
* s = newc ;
s + + ;
}
}
/*******************************************************************
Skip past some strings in a buffer . n is in bytes .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
smb_ucs2_t * skip_string_w ( smb_ucs2_t * buf , size_t n )
{
while ( n - - )
buf + = ( strlen_w ( buf ) * sizeof ( smb_ucs2_t ) ) + 1 ;
return ( buf ) ;
}
/*******************************************************************
Count the number of characters in a string . Same as strlen_w in
smb_ucs2_t string units .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
size_t str_charnum_w ( const smb_ucs2_t * s )
{
return strlen_w ( s ) ;
}
/*******************************************************************
Trim the specified elements off the front and back of a string .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
BOOL trim_string_w ( smb_ucs2_t * s , const smb_ucs2_t * front , const smb_ucs2_t * back )
{
BOOL ret = False ;
size_t front_len = ( front & & * front ) ? strlen_w ( front ) : 0 ;
size_t back_len = ( back & & * back ) ? strlen_w ( back ) : 0 ;
size_t s_len ;
while ( front_len & & strncmp_w ( s , front , front_len ) = = 0 ) {
smb_ucs2_t * p = s ;
ret = True ;
while ( 1 ) {
if ( ! ( * p = p [ front_len ] ) )
break ;
p + + ;
}
}
if ( back_len ) {
s_len = strlen_w ( s ) ;
while ( ( s_len > = back_len ) & &
( strncmp_w ( s + s_len - back_len , back , back_len ) = = 0 ) ) {
ret = True ;
s [ s_len - back_len ] = 0 ;
s_len = strlen_w ( s ) ;
}
}
return ( ret ) ;
}
/****************************************************************************
Does a string have any uppercase chars in it ?
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
BOOL strhasupper_w ( const smb_ucs2_t * s )
{
while ( * s ) {
if ( isupper_w ( * s ) )
return ( True ) ;
s + + ;
}
return ( False ) ;
}
/****************************************************************************
Does a string have any lowercase chars in it ?
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
BOOL strhaslower_w ( const smb_ucs2_t * s )
{
while ( * s ) {
if ( islower ( * s ) )
return ( True ) ;
s + + ;
}
return ( False ) ;
}
/****************************************************************************
Find the number of ' c ' chars in a string .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
size_t count_chars_w ( const smb_ucs2_t * s , smb_ucs2_t c )
{
size_t count = 0 ;
while ( * s ) {
if ( * s = = c )
count + + ;
s + + ;
}
return ( count ) ;
}
/*******************************************************************
Return True if a string consists only of one particular character .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
BOOL str_is_all_w ( const smb_ucs2_t * s , smb_ucs2_t c )
{
if ( s = = NULL )
return False ;
if ( ! * s )
return False ;
while ( * s ) {
if ( * s ! = c )
return False ;
s + + ;
}
return True ;
}
/*******************************************************************
Paranoid strcpy into a buffer of given length ( includes terminating
zero . Strips out all but ' a - Z0 - 9 ' and replaces with ' _ ' . Deliberately
does * NOT * check for multibyte characters . Don ' t change it !
2000-03-22 22:03:12 +03:00
maxlength is in ucs2 units .
1999-12-29 05:00:38 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
smb_ucs2_t * alpha_strcpy_w ( smb_ucs2_t * dest , const smb_ucs2_t * src , size_t maxlength )
{
size_t len , i ;
if ( ! dest ) {
DEBUG ( 0 , ( " ERROR: NULL dest in alpha_strcpy_w \n " ) ) ;
return NULL ;
}
if ( ! src ) {
* dest = 0 ;
return dest ;
}
len = strlen_w ( src ) ;
if ( len > = maxlength )
len = maxlength - 1 ;
for ( i = 0 ; i < len ; i + + ) {
smb_ucs2_t val = src [ i ] ;
if ( isupper_w ( val ) | | islower_w ( val ) | | isdigit_w ( val ) )
dest [ i ] = src [ i ] ;
else
dest [ i ] = ( smb_ucs2_t ) ' _ ' ;
}
dest [ i ] = 0 ;
return dest ;
}
/****************************************************************************
Like strncpy but always null terminates . Make sure there is room !
2000-03-22 22:03:12 +03:00
The variable n should always be one less than the available size and is in
ucs2 units .
1999-12-29 05:00:38 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
smb_ucs2_t * StrnCpy_w ( smb_ucs2_t * dest , const smb_ucs2_t * src , size_t n )
{
smb_ucs2_t * d = dest ;
if ( ! dest )
return ( NULL ) ;
if ( ! src ) {
* dest = 0 ;
return ( dest ) ;
}
while ( n - - & & ( * d + + = * src + + ) )
;
* d = 0 ;
return ( dest ) ;
}
/****************************************************************************
Like strncpy but copies up to the character marker . Always null terminates .
returns a pointer to the character marker in the source string ( src ) .
2000-03-22 22:03:12 +03:00
n is in ucs2 units .
1999-12-29 05:00:38 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
smb_ucs2_t * strncpyn_w ( smb_ucs2_t * dest , const smb_ucs2_t * src , size_t n , smb_ucs2_t c )
{
smb_ucs2_t * p ;
size_t str_len ;
p = strchr_w ( src , c ) ;
if ( p = = NULL ) {
fstring cval ;
smb_ucs2_t mbcval [ 2 ] ;
mbcval [ 0 ] = c ;
mbcval [ 1 ] = 0 ;
DEBUG ( 5 , ( " strncpyn_w: separator character (%s) not found \n " ,
unicode_to_unix ( cval , mbcval , sizeof ( cval ) ) ) ) ;
return NULL ;
}
2000-03-22 22:03:12 +03:00
str_len = PTR_DIFF ( p , src ) + 1 ;
1999-12-29 05:00:38 +03:00
safe_strcpy_w ( dest , src , MIN ( n , str_len ) ) ;
return p ;
}
/*************************************************************
Routine to get hex characters and turn them into a 16 byte array .
The array can be variable length , and any non - hex - numeric
characters are skipped . " 0xnn " or " 0Xnn " is specially catered
for . len is in bytes .
Valid examples : " 0A5D15 " ; " 0x15, 0x49, 0xa2 " ; " 59 \t a9 \t e3 \n "
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
static smb_ucs2_t hexprefix [ ] = { ( smb_ucs2_t ) ' 0 ' , ( smb_ucs2_t ) ' x ' , 0 } ;
static smb_ucs2_t hexchars [ ] = { ( smb_ucs2_t ) ' 0 ' , ( smb_ucs2_t ) ' 1 ' , ( smb_ucs2_t ) ' 2 ' , ( smb_ucs2_t ) ' 3 ' ,
( smb_ucs2_t ) ' 4 ' , ( smb_ucs2_t ) ' 5 ' , ( smb_ucs2_t ) ' 6 ' , ( smb_ucs2_t ) ' 7 ' ,
( smb_ucs2_t ) ' 8 ' , ( smb_ucs2_t ) ' 9 ' , ( smb_ucs2_t ) ' A ' , ( smb_ucs2_t ) ' B ' ,
( smb_ucs2_t ) ' C ' , ( smb_ucs2_t ) ' D ' , ( smb_ucs2_t ) ' E ' , ( smb_ucs2_t ) ' F ' , 0 } ;
size_t strhex_to_str_w ( char * p , size_t len , const smb_ucs2_t * strhex )
{
size_t i ;
size_t num_chars = 0 ;
unsigned char lonybble , hinybble ;
smb_ucs2_t * p1 = NULL , * p2 = NULL ;
/*
* Convert to smb_ucs2_t units .
*/
len / = sizeof ( smb_ucs2_t ) ;
for ( i = 0 ; i < len & & strhex [ i ] ! = 0 ; i + + ) {
if ( strnequal_w ( hexchars , hexprefix , 2 ) ) {
i + + ; /* skip two chars */
continue ;
}
if ( ! ( p1 = strchr_w ( hexchars , toupper_w ( strhex [ i ] ) ) ) )
break ;
i + + ; /* next hex digit */
if ( ! ( p2 = strchr_w ( hexchars , toupper_w ( strhex [ i ] ) ) ) )
break ;
/* get the two nybbles */
hinybble = ( PTR_DIFF ( p1 , hexchars ) / sizeof ( smb_ucs2_t ) ) ;
lonybble = ( PTR_DIFF ( p2 , hexchars ) / sizeof ( smb_ucs2_t ) ) ;
p [ num_chars ] = ( hinybble < < 4 ) | lonybble ;
num_chars + + ;
p1 = NULL ;
p2 = NULL ;
}
return num_chars ;
}
/****************************************************************************
Check if a string is part of a list .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
BOOL in_list_w ( smb_ucs2_t * s , smb_ucs2_t * list , BOOL casesensitive )
{
wpstring tok ;
smb_ucs2_t * p = list ;
if ( ! list )
return ( False ) ;
while ( next_token_w ( & p , tok , LIST_SEP_W , sizeof ( tok ) ) ) {
if ( casesensitive ) {
if ( strcmp_w ( tok , s ) = = 0 )
return ( True ) ;
} else {
if ( StrCaseCmp_w ( tok , s ) = = 0 )
return ( True ) ;
}
}
return ( False ) ;
}
/* This is used to prevent lots of mallocs of size 2 */
static smb_ucs2_t * null_string = NULL ;
/****************************************************************************
Set a string value , allocing the space for the string .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
BOOL string_init_w ( smb_ucs2_t * * dest , const smb_ucs2_t * src )
{
size_t l ;
if ( ! null_string ) {
if ( ( null_string = ( smb_ucs2_t * ) malloc ( sizeof ( smb_ucs2_t ) ) ) = = NULL ) {
DEBUG ( 0 , ( " string_init_w: malloc fail for null_string. \n " ) ) ;
return False ;
}
* null_string = 0 ;
}
if ( ! src )
src = null_string ;
l = strlen_w ( src ) ;
if ( l = = 0 )
* dest = null_string ;
else {
( * dest ) = ( smb_ucs2_t * ) malloc ( sizeof ( smb_ucs2_t ) * ( l + 1 ) ) ;
if ( ( * dest ) = = NULL ) {
DEBUG ( 0 , ( " Out of memory in string_init_w \n " ) ) ;
return False ;
}
wpstrcpy ( * dest , src ) ;
}
return ( True ) ;
}
/****************************************************************************
Free a string value .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
void string_free_w ( smb_ucs2_t * * s )
{
if ( ! s | | ! ( * s ) )
return ;
if ( * s = = null_string )
* s = NULL ;
if ( * s )
free ( ( char * ) * s ) ;
* s = NULL ;
}
/****************************************************************************
Set a string value , allocing the space for the string , and deallocating any
existing space .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
BOOL string_set_w ( smb_ucs2_t * * dest , const smb_ucs2_t * src )
{
string_free_w ( dest ) ;
return ( string_init_w ( dest , src ) ) ;
}
/****************************************************************************
Substitute a string for a pattern in another string . Make sure there is
enough room !
This routine looks for pattern in s and replaces it with
insert . It may do multiple replacements .
Any of " ; ' $ or ` in the insert string are replaced with _
if len = = 0 then no length check is performed
2000-03-22 22:03:12 +03:00
len is in ucs2 units .
1999-12-29 05:00:38 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
void string_sub_w ( smb_ucs2_t * s , const smb_ucs2_t * pattern , const smb_ucs2_t * insert , size_t len )
{
smb_ucs2_t * p ;
ssize_t ls , lp , li , i ;
if ( ! insert | | ! pattern | | ! s )
return ;
ls = ( ssize_t ) strlen_w ( s ) ;
lp = ( ssize_t ) strlen_w ( pattern ) ;
li = ( ssize_t ) strlen_w ( insert ) ;
if ( ! * pattern )
return ;
while ( lp < = ls & & ( p = strstr_w ( s , pattern ) ) ) {
if ( len & & ( ls + ( li - lp ) > = len ) ) {
fstring out ;
DEBUG ( 0 , ( " ERROR: string overflow by %d in string_sub_w(%.50s, %d) \n " ,
( int ) ( sizeof ( smb_ucs2_t ) * ( ls + ( li - lp ) - len ) ) ,
unicode_to_unix ( out , pattern , sizeof ( out ) ) , ( int ) len * sizeof ( smb_ucs2_t ) ) ) ;
break ;
}
if ( li ! = lp )
memmove ( p + li , p + lp , sizeof ( smb_ucs2_t ) * ( strlen_w ( p + lp ) + 1 ) ) ;
for ( i = 0 ; i < li ; i + + ) {
switch ( insert [ i ] ) {
case ( smb_ucs2_t ) ' ` ' :
case ( smb_ucs2_t ) ' " ' :
case ( smb_ucs2_t ) ' \' ' :
case ( smb_ucs2_t ) ' ; ' :
case ( smb_ucs2_t ) ' $ ' :
case ( smb_ucs2_t ) ' % ' :
case ( smb_ucs2_t ) ' \r ' :
case ( smb_ucs2_t ) ' \n ' :
p [ i ] = ( smb_ucs2_t ) ' _ ' ;
break ;
default :
p [ i ] = insert [ i ] ;
}
}
s = p + li ;
ls + = ( li - lp ) ;
}
}
void fstring_sub_w ( smb_ucs2_t * s , const smb_ucs2_t * pattern , const smb_ucs2_t * insert )
{
string_sub_w ( s , pattern , insert , sizeof ( wfstring ) ) ;
}
void pstring_sub_w ( smb_ucs2_t * s , const smb_ucs2_t * pattern , smb_ucs2_t * insert )
{
string_sub_w ( s , pattern , insert , sizeof ( wpstring ) ) ;
}
/****************************************************************************
Similar to string_sub ( ) but allows for any character to be substituted .
Use with caution !
if len = = 0 then no length check is performed .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
void all_string_sub_w ( smb_ucs2_t * s , const smb_ucs2_t * pattern , const smb_ucs2_t * insert , size_t len )
{
smb_ucs2_t * p ;
ssize_t ls , lp , li ;
if ( ! insert | | ! pattern | | ! s )
return ;
ls = ( ssize_t ) strlen_w ( s ) ;
lp = ( ssize_t ) strlen_w ( pattern ) ;
li = ( ssize_t ) strlen_w ( insert ) ;
if ( ! * pattern )
return ;
while ( lp < = ls & & ( p = strstr_w ( s , pattern ) ) ) {
if ( len & & ( ls + ( li - lp ) > = len ) ) {
fstring out ;
DEBUG ( 0 , ( " ERROR: string overflow by %d in all_string_sub_w(%.50s, %d) \n " ,
( int ) ( sizeof ( smb_ucs2_t ) * ( ls + ( li - lp ) - len ) ) ,
unicode_to_unix ( out , pattern , sizeof ( out ) ) , ( int ) len * sizeof ( smb_ucs2_t ) ) ) ;
break ;
}
if ( li ! = lp )
memmove ( p + li , p + lp , sizeof ( smb_ucs2_t ) * ( strlen_w ( p + lp ) + 1 ) ) ;
memcpy ( p , insert , li * sizeof ( smb_ucs2_t ) ) ;
s = p + li ;
ls + = ( li - lp ) ;
}
}
/****************************************************************************
Splits out the front and back at a separator .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
void split_at_last_component_w ( smb_ucs2_t * path , smb_ucs2_t * front , smb_ucs2_t sep , smb_ucs2_t * back )
{
smb_ucs2_t * p = strrchr_w ( path , sep ) ;
if ( p ! = NULL )
* p = 0 ;
if ( front ! = NULL )
wpstrcpy ( front , path ) ;
if ( p ! = NULL ) {
if ( back ! = NULL )
wpstrcpy ( back , p + 1 ) ;
* p = ( smb_ucs2_t ) ' \\ ' ;
} else {
if ( back ! = NULL )
back [ 0 ] = 0 ;
}
}
/****************************************************************************
Write an octal as a string .
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
smb_ucs2_t * octal_string_w ( int i )
{
static smb_ucs2_t wret [ 64 ] ;
char ret [ 64 ] ;
if ( i = = - 1 )
slprintf ( ret , sizeof ( ret ) , " -1 " ) ;
else
slprintf ( ret , sizeof ( ret ) , " 0%o " , i ) ;
return unix_to_unicode ( wret , ret , sizeof ( wret ) ) ;
}
/****************************************************************************
Truncate a string at a specified length .
2000-03-22 22:03:12 +03:00
length is in ucs2 units .
1999-12-29 05:00:38 +03:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
smb_ucs2_t * string_truncate_w ( smb_ucs2_t * s , size_t length )
{
if ( s & & strlen_w ( s ) > length )
s [ length ] = 0 ;
return s ;
}
2000-10-03 06:12:14 +04:00
/******************************************************************
functions for UTF8 support ( using in kanji . c )
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
smb_ucs2_t doscp2ucs2 ( int w )
{
return ( ( smb_ucs2_t ) doscp_to_ucs2 [ w ] ) ;
}
int ucs2doscp ( smb_ucs2_t w )
{
return ( ( int ) ucs2_to_doscp [ w ] ) ;
}