1996-05-04 11:50:46 +04:00
/*
2002-01-30 09:08:46 +03:00
Unix SMB / CIFS implementation .
1996-05-04 11:50:46 +04:00
Character set conversion Extensions
2001-07-04 11:15:53 +04:00
Copyright ( C ) Igor Vergeichik < iverg @ mail . ru > 2001
Copyright ( C ) Andrew Tridgell 2001
2001-11-12 03:53:34 +03:00
Copyright ( C ) Simo Sorce 2001
1996-05-04 11:50:46 +04:00
This program is free software ; you can redistribute it and / or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation ; either version 2 of the License , or
( at your option ) any later version .
This program is distributed in the hope that it will be useful ,
but WITHOUT ANY WARRANTY ; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE . See the
GNU General Public License for more details .
You should have received a copy of the GNU General Public License
along with this program ; if not , write to the Free Software
Foundation , Inc . , 675 Mass Ave , Cambridge , MA 0213 9 , USA .
*/
# include "includes.h"
2001-07-04 11:15:53 +04:00
2003-02-24 06:09:08 +03:00
/**
* @ file
*
2003-02-24 07:49:10 +03:00
* @ brief Character - set conversion routines built on our iconv .
*
* @ note Samba ' s internal character set ( at least in the 3.0 series )
* is always the same as the one for the Unix filesystem . It is
* < b > not < / b > necessarily UTF - 8 and may be different on machines that
* need i18n filenames to be compatible with Unix software . It does
* have to be a superset of ASCII . All multibyte sequences must start
* with a byte with the high bit set .
2003-02-24 06:09:08 +03:00
*
* @ sa lib / iconv . c
2003-02-24 07:49:10 +03:00
*/
static pstring cvtbuf ;
static smb_iconv_t conv_handles [ NUM_CHARSETS ] [ NUM_CHARSETS ] ;
2003-02-24 06:09:08 +03:00
2002-11-12 01:13:05 +03:00
2003-02-24 06:09:08 +03:00
/**
* Return the name of a charset to give to iconv ( ) .
* */
2003-01-03 11:28:12 +03:00
static const char * charset_name ( charset_t ch )
2001-09-07 18:14:57 +04:00
{
2003-01-03 11:28:12 +03:00
const char * ret = NULL ;
2001-09-07 18:14:57 +04:00
if ( ch = = CH_UCS2 ) ret = " UCS-2LE " ;
else if ( ch = = CH_UNIX ) ret = lp_unix_charset ( ) ;
else if ( ch = = CH_DOS ) ret = lp_dos_charset ( ) ;
else if ( ch = = CH_DISPLAY ) ret = lp_display_charset ( ) ;
2002-03-01 03:57:47 +03:00
else if ( ch = = CH_UTF8 ) ret = " UTF8 " ;
2001-09-07 18:14:57 +04:00
if ( ! ret | | ! * ret ) ret = " ASCII " ;
return ret ;
}
1996-05-04 11:50:46 +04:00
2002-01-22 06:51:28 +03:00
static void lazy_initialize_conv ( void )
{
static int initialized = False ;
if ( ! initialized ) {
initialized = True ;
load_case_tables ( ) ;
init_iconv ( ) ;
}
}
2003-02-24 06:09:08 +03:00
/**
2003-04-04 11:50:59 +04:00
* Initialize iconv conversion descriptors .
*
* This is called the first time it is needed , and also called again
* every time the configuration is reloaded , because the charset or
* codepage might have changed .
* */
2001-09-07 18:14:57 +04:00
void init_iconv ( void )
2001-07-04 11:15:53 +04:00
{
2001-09-07 18:14:57 +04:00
int c1 , c2 ;
2001-12-20 09:18:52 +03:00
BOOL did_reload = False ;
2001-09-07 18:14:57 +04:00
/* so that charset_name() works we need to get the UNIX<->UCS2 going
first */
2002-11-12 01:13:05 +03:00
if ( ! conv_handles [ CH_UNIX ] [ CH_UCS2 ] )
2001-09-07 18:14:57 +04:00
conv_handles [ CH_UNIX ] [ CH_UCS2 ] = smb_iconv_open ( " UCS-2LE " , " ASCII " ) ;
2002-11-12 01:13:05 +03:00
if ( ! conv_handles [ CH_UCS2 ] [ CH_UNIX ] )
2001-09-07 18:14:57 +04:00
conv_handles [ CH_UCS2 ] [ CH_UNIX ] = smb_iconv_open ( " ASCII " , " UCS-2LE " ) ;
2001-07-04 11:15:53 +04:00
2001-09-07 18:14:57 +04:00
for ( c1 = 0 ; c1 < NUM_CHARSETS ; c1 + + ) {
for ( c2 = 0 ; c2 < NUM_CHARSETS ; c2 + + ) {
2003-01-03 11:28:12 +03:00
const char * n1 = charset_name ( ( charset_t ) c1 ) ;
const char * n2 = charset_name ( ( charset_t ) c2 ) ;
2001-12-20 09:18:52 +03:00
if ( conv_handles [ c1 ] [ c2 ] & &
strcmp ( n1 , conv_handles [ c1 ] [ c2 ] - > from_name ) = = 0 & &
2002-11-12 01:13:05 +03:00
strcmp ( n2 , conv_handles [ c1 ] [ c2 ] - > to_name ) = = 0 )
continue ;
2001-12-20 09:18:52 +03:00
did_reload = True ;
2002-11-12 01:13:05 +03:00
if ( conv_handles [ c1 ] [ c2 ] )
2001-09-07 18:14:57 +04:00
smb_iconv_close ( conv_handles [ c1 ] [ c2 ] ) ;
2002-11-12 01:13:05 +03:00
2001-09-07 18:14:57 +04:00
conv_handles [ c1 ] [ c2 ] = smb_iconv_open ( n2 , n1 ) ;
if ( conv_handles [ c1 ] [ c2 ] = = ( smb_iconv_t ) - 1 ) {
DEBUG ( 0 , ( " Conversion from %s to %s not supported \n " ,
2001-10-23 23:10:30 +04:00
charset_name ( ( charset_t ) c1 ) , charset_name ( ( charset_t ) c2 ) ) ) ;
2001-09-07 18:14:57 +04:00
conv_handles [ c1 ] [ c2 ] = NULL ;
}
}
}
2001-12-20 09:18:52 +03:00
if ( did_reload ) {
init_valid_table ( ) ;
}
2001-07-04 11:15:53 +04:00
}
1996-05-04 11:50:46 +04:00
2001-11-23 07:24:26 +03:00
/**
* Convert string from one encoding to another , making error checking etc
*
* @ param src pointer to source string ( multibyte or singlebyte )
* @ param srclen length of the source string in bytes
* @ param dest pointer to destination string ( multibyte or singlebyte )
* @ param destlen maximal length allowed for string
2003-02-24 06:09:08 +03:00
* @ returns the number of bytes occupied in the destination
2001-11-23 07:24:26 +03:00
* */
2001-09-07 18:14:57 +04:00
size_t convert_string ( charset_t from , charset_t to ,
void const * src , size_t srclen ,
void * dest , size_t destlen )
2001-07-04 11:15:53 +04:00
{
size_t i_len , o_len ;
size_t retval ;
2001-11-29 02:54:07 +03:00
const char * inbuf = ( const char * ) src ;
2001-07-04 11:15:53 +04:00
char * outbuf = ( char * ) dest ;
2001-09-07 18:14:57 +04:00
smb_iconv_t descriptor ;
2002-11-12 01:13:05 +03:00
if ( srclen = = ( size_t ) - 1 )
srclen = strlen ( src ) + 1 ;
2001-09-24 10:24:14 +04:00
2002-01-22 06:51:28 +03:00
lazy_initialize_conv ( ) ;
2001-07-04 11:15:53 +04:00
2001-09-07 18:14:57 +04:00
descriptor = conv_handles [ from ] [ to ] ;
if ( descriptor = = ( smb_iconv_t ) - 1 | | descriptor = = ( smb_iconv_t ) 0 ) {
2001-07-04 11:15:53 +04:00
/* conversion not supported, use as is */
2002-11-12 01:13:05 +03:00
size_t len = MIN ( srclen , destlen ) ;
2001-07-04 11:15:53 +04:00
memcpy ( dest , src , len ) ;
return len ;
}
i_len = srclen ;
o_len = destlen ;
2001-11-23 07:53:56 +03:00
retval = smb_iconv ( descriptor , & inbuf , & i_len , & outbuf , & o_len ) ;
2003-02-01 10:25:53 +03:00
if ( retval = = ( size_t ) - 1 ) {
2003-01-03 11:28:12 +03:00
const char * reason = " unknown error " ;
2002-11-12 01:13:05 +03:00
switch ( errno ) {
case EINVAL :
reason = " Incomplete multibyte sequence " ;
break ;
case E2BIG :
reason = " No more room " ;
DEBUG ( 0 , ( " convert_string: Required %d, available %d \n " ,
srclen , destlen ) ) ;
/* we are not sure we need srclen bytes,
2001-11-04 21:26:53 +03:00
may be more , may be less .
We only know we need more than destlen
bytes - - - simo */
2001-07-04 11:15:53 +04:00
break ;
2002-11-12 01:13:05 +03:00
case EILSEQ :
reason = " Illegal multibyte sequence " ;
break ;
2001-07-04 11:15:53 +04:00
}
/* smb_panic(reason); */
}
return destlen - o_len ;
}
1996-05-04 11:50:46 +04:00
2001-11-23 07:24:26 +03:00
/**
* Convert between character sets , allocating a new buffer for the result .
*
* @ param srclen length of source buffer .
2002-03-23 11:39:04 +03:00
* @ param dest always set at least to NULL
2001-11-23 07:24:26 +03:00
* @ note - 1 is not accepted for srclen .
*
2003-02-24 06:09:08 +03:00
* @ returns Size in bytes of the converted string ; or - 1 in case of error .
2001-11-23 07:24:26 +03:00
* */
2002-11-12 01:13:05 +03:00
2003-03-20 19:44:14 +03:00
size_t convert_string_allocate ( charset_t from , charset_t to ,
2001-11-07 21:14:46 +03:00
void const * src , size_t srclen , void * * dest )
{
size_t i_len , o_len , destlen ;
size_t retval ;
2001-11-29 02:54:07 +03:00
const char * inbuf = ( const char * ) src ;
2001-11-07 21:14:46 +03:00
char * outbuf , * ob ;
smb_iconv_t descriptor ;
* dest = NULL ;
2002-11-12 01:13:05 +03:00
if ( src = = NULL | | srclen = = ( size_t ) - 1 )
return ( size_t ) - 1 ;
2001-11-07 21:14:46 +03:00
2002-01-22 06:51:28 +03:00
lazy_initialize_conv ( ) ;
2001-11-07 21:14:46 +03:00
descriptor = conv_handles [ from ] [ to ] ;
if ( descriptor = = ( smb_iconv_t ) - 1 | | descriptor = = ( smb_iconv_t ) 0 ) {
/* conversion not supported, return -1*/
2002-02-04 03:59:23 +03:00
DEBUG ( 3 , ( " convert_string_allocate: conversion not supported! \n " ) ) ;
2001-11-07 21:14:46 +03:00
return - 1 ;
}
2001-11-10 18:21:54 +03:00
destlen = MAX ( srclen , 512 ) ;
2001-11-07 21:14:46 +03:00
outbuf = NULL ;
convert :
destlen = destlen * 2 ;
ob = ( char * ) realloc ( outbuf , destlen ) ;
if ( ! ob ) {
DEBUG ( 0 , ( " convert_string_allocate: realloc failed! \n " ) ) ;
2001-11-12 03:53:34 +03:00
SAFE_FREE ( outbuf ) ;
2002-11-12 01:13:05 +03:00
return ( size_t ) - 1 ;
2001-11-07 21:14:46 +03:00
}
2002-11-12 01:13:05 +03:00
else
outbuf = ob ;
2001-11-07 21:14:46 +03:00
i_len = srclen ;
o_len = destlen ;
retval = smb_iconv ( descriptor ,
2001-11-23 07:53:56 +03:00
& inbuf , & i_len ,
2001-11-23 07:24:26 +03:00
& outbuf , & o_len ) ;
2003-02-01 10:25:53 +03:00
if ( retval = = ( size_t ) - 1 ) {
2003-01-03 11:28:12 +03:00
const char * reason = " unknown error " ;
2002-11-12 01:13:05 +03:00
switch ( errno ) {
case EINVAL :
reason = " Incomplete multibyte sequence " ;
break ;
case E2BIG :
goto convert ;
case EILSEQ :
reason = " Illegal multibyte sequence " ;
break ;
2001-11-07 21:14:46 +03:00
}
DEBUG ( 0 , ( " Conversion error: %s(%s) \n " , reason , inbuf ) ) ;
/* smb_panic(reason); */
2002-11-12 01:13:05 +03:00
return ( size_t ) - 1 ;
2001-11-07 21:14:46 +03:00
}
destlen = destlen - o_len ;
2001-11-12 04:31:43 +03:00
* dest = ( char * ) Realloc ( ob , destlen ) ;
2001-11-07 21:14:46 +03:00
if ( ! * dest ) {
DEBUG ( 0 , ( " convert_string_allocate: out of memory! \n " ) ) ;
2001-11-12 03:53:34 +03:00
SAFE_FREE ( ob ) ;
2002-11-12 01:13:05 +03:00
return ( size_t ) - 1 ;
2001-11-07 21:14:46 +03:00
}
2001-11-10 18:21:54 +03:00
2001-11-07 21:14:46 +03:00
return destlen ;
}
2003-02-24 06:09:08 +03:00
2002-03-23 11:39:04 +03:00
/**
* Convert between character sets , allocating a new buffer using talloc for the result .
*
* @ param srclen length of source buffer .
* @ param dest always set at least to NULL
* @ note - 1 is not accepted for srclen .
*
2003-02-24 06:09:08 +03:00
* @ returns Size in bytes of the converted string ; or - 1 in case of error .
2002-03-23 11:39:04 +03:00
* */
2003-03-18 04:48:11 +03:00
static size_t convert_string_talloc ( TALLOC_CTX * ctx , charset_t from , charset_t to ,
2002-03-23 11:39:04 +03:00
void const * src , size_t srclen , void * * dest )
{
2002-08-17 21:00:51 +04:00
void * alloced_string ;
2002-03-23 11:39:04 +03:00
size_t dest_len ;
* dest = NULL ;
2002-08-17 21:00:51 +04:00
dest_len = convert_string_allocate ( from , to , src , srclen , & alloced_string ) ;
2002-11-12 01:13:05 +03:00
if ( dest_len = = ( size_t ) - 1 )
return ( size_t ) - 1 ;
2002-08-17 21:00:51 +04:00
* dest = talloc_memdup ( ctx , alloced_string , dest_len ) ;
SAFE_FREE ( alloced_string ) ;
2002-03-23 11:39:04 +03:00
if ( * dest = = NULL )
2002-11-12 01:13:05 +03:00
return ( size_t ) - 1 ;
2002-03-23 11:39:04 +03:00
return dest_len ;
}
2002-11-12 01:13:05 +03:00
size_t unix_strupper ( const char * src , size_t srclen , char * dest , size_t destlen )
2001-07-04 11:15:53 +04:00
{
2002-11-12 01:13:05 +03:00
size_t size ;
2001-07-04 11:15:53 +04:00
smb_ucs2_t * buffer = ( smb_ucs2_t * ) cvtbuf ;
2001-09-07 18:14:57 +04:00
size = convert_string ( CH_UNIX , CH_UCS2 , src , srclen , buffer , sizeof ( cvtbuf ) ) ;
2002-11-12 01:13:05 +03:00
if ( ! strupper_w ( buffer ) & & ( dest = = src ) )
return srclen ;
2001-09-07 18:14:57 +04:00
return convert_string ( CH_UCS2 , CH_UNIX , buffer , size , dest , destlen ) ;
2001-07-04 11:15:53 +04:00
}
1996-05-04 11:50:46 +04:00
2002-11-12 01:13:05 +03:00
size_t unix_strlower ( const char * src , size_t srclen , char * dest , size_t destlen )
2001-07-04 11:15:53 +04:00
{
2002-11-12 01:13:05 +03:00
size_t size ;
2001-07-04 11:15:53 +04:00
smb_ucs2_t * buffer = ( smb_ucs2_t * ) cvtbuf ;
2001-09-07 18:14:57 +04:00
size = convert_string ( CH_UNIX , CH_UCS2 , src , srclen , buffer , sizeof ( cvtbuf ) ) ;
2002-11-12 01:13:05 +03:00
if ( ! strlower_w ( buffer ) & & ( dest = = src ) )
return srclen ;
2001-09-07 18:14:57 +04:00
return convert_string ( CH_UCS2 , CH_UNIX , buffer , size , dest , destlen ) ;
1996-05-04 11:50:46 +04:00
}
2003-03-18 04:48:11 +03:00
static size_t ucs2_align ( const void * base_ptr , const void * p , int flags )
2001-07-04 11:15:53 +04:00
{
2002-11-12 01:13:05 +03:00
if ( flags & ( STR_NOALIGN | STR_ASCII ) )
return 0 ;
2001-07-04 11:15:53 +04:00
return PTR_DIFF ( p , base_ptr ) & 1 ;
1996-05-04 11:50:46 +04:00
}
2001-07-04 11:15:53 +04:00
2003-02-24 06:09:08 +03:00
/**
* Copy a string from a char * unix src to a dos codepage string destination .
*
* @ return the number of bytes occupied by the string in the destination .
*
* @ param flags can include
* < dl >
* < dt > STR_TERMINATE < / dt > < dd > means include the null termination < / dd >
* < dt > STR_UPPER < / dt > < dd > means uppercase in the destination < / dd >
* < / dl >
*
* @ param dest_len the maximum length in bytes allowed in the
* destination . If @ p dest_len is - 1 then no maximum is used .
* */
2002-11-12 01:13:05 +03:00
size_t push_ascii ( void * dest , const char * src , size_t dest_len , int flags )
1999-12-13 16:27:58 +03:00
{
2002-11-12 01:13:05 +03:00
size_t src_len = strlen ( src ) ;
2001-07-04 11:15:53 +04:00
pstring tmpbuf ;
1997-01-09 21:02:17 +03:00
2001-07-04 11:15:53 +04:00
/* treat a pstring as "unlimited" length */
2002-11-12 01:13:05 +03:00
if ( dest_len = = ( size_t ) - 1 )
2001-07-04 11:15:53 +04:00
dest_len = sizeof ( pstring ) ;
1996-05-04 11:50:46 +04:00
2001-07-04 11:15:53 +04:00
if ( flags & STR_UPPER ) {
pstrcpy ( tmpbuf , src ) ;
strupper ( tmpbuf ) ;
src = tmpbuf ;
}
2001-02-15 00:56:57 +03:00
2002-11-12 01:13:05 +03:00
if ( flags & STR_TERMINATE )
2001-07-04 11:15:53 +04:00
src_len + + ;
2001-09-07 18:14:57 +04:00
return convert_string ( CH_UNIX , CH_DOS , src , src_len , dest , dest_len ) ;
1997-05-09 01:17:59 +04:00
}
2002-11-12 01:13:05 +03:00
size_t push_ascii_fstring ( void * dest , const char * src )
2001-07-04 11:15:53 +04:00
{
return push_ascii ( dest , src , sizeof ( fstring ) , STR_TERMINATE ) ;
}
1998-01-17 10:08:21 +03:00
2002-11-12 01:13:05 +03:00
size_t push_ascii_pstring ( void * dest , const char * src )
2001-07-04 11:15:53 +04:00
{
return push_ascii ( dest , src , sizeof ( pstring ) , STR_TERMINATE ) ;
}
1998-01-17 10:08:21 +03:00
2003-02-24 06:09:08 +03:00
/**
* Copy a string from a dos codepage source to a unix char * destination .
*
* The resulting string in " dest " is always null terminated .
*
* @ param flags can have :
* < dl >
* < dt > STR_TERMINATE < / dt >
* < dd > STR_TERMINATE means the string in @ p src
* is null terminated , and src_len is ignored . < / dd >
* < / dl >
*
* @ param src_len is the length of the source area in bytes .
* @ returns the number of bytes occupied by the string in @ p src .
* */
2002-11-12 01:13:05 +03:00
size_t pull_ascii ( char * dest , const void * src , size_t dest_len , size_t src_len , int flags )
1999-12-13 16:27:58 +03:00
{
2002-11-12 01:13:05 +03:00
size_t ret ;
2001-07-04 11:15:53 +04:00
2002-11-12 01:13:05 +03:00
if ( dest_len = = ( size_t ) - 1 )
2001-07-04 11:15:53 +04:00
dest_len = sizeof ( pstring ) ;
2002-07-15 14:35:28 +04:00
if ( flags & STR_TERMINATE ) {
2002-11-12 01:13:05 +03:00
if ( src_len = = ( size_t ) - 1 ) {
2002-07-15 14:35:28 +04:00
src_len = strlen ( src ) + 1 ;
} else {
2002-11-12 01:13:05 +03:00
size_t len = strnlen ( src , src_len ) ;
if ( len < src_len )
len + + ;
2002-07-15 14:35:28 +04:00
src_len = len ;
}
}
2001-07-04 11:15:53 +04:00
2001-09-07 18:14:57 +04:00
ret = convert_string ( CH_DOS , CH_UNIX , src , src_len , dest , dest_len ) ;
2001-07-04 11:15:53 +04:00
2002-11-12 01:13:05 +03:00
if ( dest_len )
dest [ MIN ( ret , dest_len - 1 ) ] = 0 ;
2001-07-04 11:15:53 +04:00
return src_len ;
1998-01-17 10:08:21 +03:00
}
2002-11-12 01:13:05 +03:00
size_t pull_ascii_pstring ( char * dest , const void * src )
2001-07-04 11:15:53 +04:00
{
return pull_ascii ( dest , src , sizeof ( pstring ) , - 1 , STR_TERMINATE ) ;
}
2001-01-08 02:00:49 +03:00
2002-11-12 01:13:05 +03:00
size_t pull_ascii_fstring ( char * dest , const void * src )
2001-01-08 02:00:49 +03:00
{
2001-07-04 11:15:53 +04:00
return pull_ascii ( dest , src , sizeof ( fstring ) , - 1 , STR_TERMINATE ) ;
2001-01-08 02:00:49 +03:00
}
2003-02-24 06:09:08 +03:00
/**
* Copy a string from a char * src to a unicode destination .
*
* @ returns the number of bytes occupied by the string in the destination .
*
* @ param flags can have :
*
* < dl >
* < dt > STR_TERMINATE < dd > means include the null termination .
* < dt > STR_UPPER < dd > means uppercase in the destination .
* < dt > STR_NOALIGN < dd > means don ' t do alignment .
* < / dl >
*
* @ param dest_len is the maximum length allowed in the
* destination . If dest_len is - 1 then no maxiumum is used .
* */
2002-11-12 01:13:05 +03:00
size_t push_ucs2 ( const void * base_ptr , void * dest , const char * src , size_t dest_len , int flags )
2001-07-04 11:15:53 +04:00
{
2002-11-12 01:13:05 +03:00
size_t len = 0 ;
size_t src_len = strlen ( src ) ;
2001-07-04 11:15:53 +04:00
pstring tmpbuf ;
/* treat a pstring as "unlimited" length */
2002-11-12 01:13:05 +03:00
if ( dest_len = = ( size_t ) - 1 )
2001-07-04 11:15:53 +04:00
dest_len = sizeof ( pstring ) ;
if ( flags & STR_UPPER ) {
pstrcpy ( tmpbuf , src ) ;
strupper ( tmpbuf ) ;
src = tmpbuf ;
}
2002-11-12 01:13:05 +03:00
if ( flags & STR_TERMINATE )
2001-07-04 11:15:53 +04:00
src_len + + ;
if ( ucs2_align ( base_ptr , dest , flags ) ) {
* ( char * ) dest = 0 ;
dest = ( void * ) ( ( char * ) dest + 1 ) ;
if ( dest_len ) dest_len - - ;
len + + ;
}
2001-07-25 08:00:40 +04:00
/* ucs2 is always a multiple of 2 bytes */
dest_len & = ~ 1 ;
2001-09-07 18:14:57 +04:00
len + = convert_string ( CH_UNIX , CH_UCS2 , src , src_len , dest , dest_len ) ;
2001-07-04 11:15:53 +04:00
return len ;
2001-02-15 00:56:57 +03:00
}
2001-01-08 02:00:49 +03:00
2003-02-24 06:09:08 +03:00
2002-03-25 10:41:42 +03:00
/**
2003-02-24 06:09:08 +03:00
* Copy a string from a unix char * src to a UCS2 destination ,
* allocating a buffer using talloc ( ) .
2002-03-25 10:41:42 +03:00
*
* @ param dest always set at least to NULL
*
2003-02-24 06:09:08 +03:00
* @ returns The number of bytes occupied by the string in the destination
2002-09-25 19:19:00 +04:00
* or - 1 in case of error .
2002-03-25 10:41:42 +03:00
* */
2002-11-12 01:13:05 +03:00
size_t push_ucs2_talloc ( TALLOC_CTX * ctx , smb_ucs2_t * * dest , const char * src )
2002-03-25 10:41:42 +03:00
{
2002-11-12 01:13:05 +03:00
size_t src_len = strlen ( src ) + 1 ;
2002-03-25 10:41:42 +03:00
* dest = NULL ;
2002-09-25 19:19:00 +04:00
return convert_string_talloc ( ctx , CH_UNIX , CH_UCS2 , src , src_len , ( void * * ) dest ) ;
2002-03-25 10:41:42 +03:00
}
2003-02-24 06:09:08 +03:00
2002-03-25 10:41:42 +03:00
/**
* Copy a string from a unix char * src to a UCS2 destination , allocating a buffer
*
* @ param dest always set at least to NULL
*
2003-02-24 06:09:08 +03:00
* @ returns The number of bytes occupied by the string in the destination
2002-09-25 19:19:00 +04:00
* or - 1 in case of error .
2002-03-25 10:41:42 +03:00
* */
2002-11-12 01:13:05 +03:00
size_t push_ucs2_allocate ( smb_ucs2_t * * dest , const char * src )
2002-03-25 10:41:42 +03:00
{
2002-11-12 01:13:05 +03:00
size_t src_len = strlen ( src ) + 1 ;
2002-03-25 10:41:42 +03:00
* dest = NULL ;
2002-09-25 19:19:00 +04:00
return convert_string_allocate ( CH_UNIX , CH_UCS2 , src , src_len , ( void * * ) dest ) ;
2002-03-25 10:41:42 +03:00
}
2003-02-24 06:09:08 +03:00
/**
2002-11-12 01:13:05 +03:00
Copy a string from a char * src to a UTF - 8 destination .
Return the number of bytes occupied by the string in the destination
Flags can have :
2002-02-20 02:02:39 +03:00
STR_TERMINATE means include the null termination
STR_UPPER means uppercase in the destination
2002-11-12 01:13:05 +03:00
dest_len is the maximum length allowed in the destination . If dest_len
is - 1 then no maxiumum is used .
2003-02-24 06:09:08 +03:00
* */
2002-11-12 01:13:05 +03:00
2003-03-18 04:48:11 +03:00
static size_t push_utf8 ( void * dest , const char * src , size_t dest_len , int flags )
2002-02-20 02:02:39 +03:00
{
2002-11-12 01:13:05 +03:00
size_t src_len = strlen ( src ) ;
2002-02-20 02:02:39 +03:00
pstring tmpbuf ;
/* treat a pstring as "unlimited" length */
2002-11-12 01:13:05 +03:00
if ( dest_len = = ( size_t ) - 1 )
2002-02-20 02:02:39 +03:00
dest_len = sizeof ( pstring ) ;
if ( flags & STR_UPPER ) {
pstrcpy ( tmpbuf , src ) ;
strupper ( tmpbuf ) ;
src = tmpbuf ;
}
2002-11-12 01:13:05 +03:00
if ( flags & STR_TERMINATE )
2002-02-20 02:02:39 +03:00
src_len + + ;
return convert_string ( CH_UNIX , CH_UTF8 , src , src_len , dest , dest_len ) ;
}
1998-01-17 10:08:21 +03:00
2002-11-12 01:13:05 +03:00
size_t push_utf8_fstring ( void * dest , const char * src )
2002-03-01 04:11:02 +03:00
{
return push_utf8 ( dest , src , sizeof ( fstring ) , STR_TERMINATE ) ;
}
2002-03-23 11:39:04 +03:00
/**
* Copy a string from a unix char * src to a UTF - 8 destination , allocating a buffer using talloc
*
* @ param dest always set at least to NULL
*
2003-02-24 06:09:08 +03:00
* @ returns The number of bytes occupied by the string in the destination
2002-03-23 11:39:04 +03:00
* */
2002-11-12 01:13:05 +03:00
size_t push_utf8_talloc ( TALLOC_CTX * ctx , char * * dest , const char * src )
2002-03-23 11:39:04 +03:00
{
2002-11-12 01:13:05 +03:00
size_t src_len = strlen ( src ) + 1 ;
2002-03-23 11:39:04 +03:00
* dest = NULL ;
2002-08-17 21:00:51 +04:00
return convert_string_talloc ( ctx , CH_UNIX , CH_UTF8 , src , src_len , ( void * * ) dest ) ;
2002-03-23 11:39:04 +03:00
}
/**
* Copy a string from a unix char * src to a UTF - 8 destination , allocating a buffer
*
* @ param dest always set at least to NULL
*
2003-02-24 06:09:08 +03:00
* @ returns The number of bytes occupied by the string in the destination
2002-03-23 11:39:04 +03:00
* */
2002-11-12 01:13:05 +03:00
size_t push_utf8_allocate ( char * * dest , const char * src )
2002-03-23 11:39:04 +03:00
{
2002-11-12 01:13:05 +03:00
size_t src_len = strlen ( src ) + 1 ;
2002-03-23 11:39:04 +03:00
* dest = NULL ;
2002-10-01 22:26:00 +04:00
return convert_string_allocate ( CH_UNIX , CH_UTF8 , src , src_len , ( void * * ) dest ) ;
2002-03-23 11:39:04 +03:00
}
2003-02-24 06:09:08 +03:00
/**
2002-11-12 01:13:05 +03:00
Copy a string from a ucs2 source to a unix char * destination .
Flags can have :
STR_TERMINATE means the string in src is null terminated .
STR_NOALIGN means don ' t try to align .
if STR_TERMINATE is set then src_len is ignored if it is - 1.
src_len is the length of the source area in bytes
Return the number of bytes occupied by the string in src .
The resulting string in " dest " is always null terminated .
2003-02-24 06:09:08 +03:00
* */
2002-11-12 01:13:05 +03:00
size_t pull_ucs2 ( const void * base_ptr , char * dest , const void * src , size_t dest_len , size_t src_len , int flags )
1998-01-17 10:08:21 +03:00
{
2002-11-12 01:13:05 +03:00
size_t ret ;
2001-07-04 11:15:53 +04:00
2002-11-12 01:13:05 +03:00
if ( dest_len = = ( size_t ) - 1 )
2001-07-04 11:15:53 +04:00
dest_len = sizeof ( pstring ) ;
1998-01-17 10:08:21 +03:00
2001-07-04 11:15:53 +04:00
if ( ucs2_align ( base_ptr , src , flags ) ) {
src = ( const void * ) ( ( const char * ) src + 1 ) ;
2002-11-12 01:13:05 +03:00
if ( src_len > 0 )
src_len - - ;
2001-07-04 11:15:53 +04:00
}
1999-12-13 16:27:58 +03:00
2002-07-15 14:35:28 +04:00
if ( flags & STR_TERMINATE ) {
2002-11-12 01:13:05 +03:00
if ( src_len = = ( size_t ) - 1 ) {
2002-07-15 14:35:28 +04:00
src_len = strlen_w ( src ) * 2 + 2 ;
} else {
2002-11-12 01:13:05 +03:00
size_t len = strnlen_w ( src , src_len / 2 ) ;
if ( len < src_len / 2 )
len + + ;
2002-07-15 14:35:28 +04:00
src_len = len * 2 ;
}
}
1999-12-13 16:27:58 +03:00
2001-07-25 08:00:40 +04:00
/* ucs2 is always a multiple of 2 bytes */
2002-11-12 01:13:05 +03:00
if ( src_len ! = ( size_t ) - 1 )
2002-08-17 21:00:51 +04:00
src_len & = ~ 1 ;
2001-07-25 08:00:40 +04:00
2001-09-07 18:14:57 +04:00
ret = convert_string ( CH_UCS2 , CH_UNIX , src , src_len , dest , dest_len ) ;
2002-11-12 01:13:05 +03:00
if ( dest_len )
dest [ MIN ( ret , dest_len - 1 ) ] = 0 ;
1999-12-13 16:27:58 +03:00
2001-07-04 11:15:53 +04:00
return src_len ;
}
1999-12-13 16:27:58 +03:00
2002-11-12 01:13:05 +03:00
size_t pull_ucs2_pstring ( char * dest , const void * src )
2001-07-04 11:15:53 +04:00
{
return pull_ucs2 ( NULL , dest , src , sizeof ( pstring ) , - 1 , STR_TERMINATE ) ;
1999-12-13 16:27:58 +03:00
}
2002-11-12 01:13:05 +03:00
size_t pull_ucs2_fstring ( char * dest , const void * src )
1996-05-04 11:50:46 +04:00
{
2001-07-04 11:15:53 +04:00
return pull_ucs2 ( NULL , dest , src , sizeof ( fstring ) , - 1 , STR_TERMINATE ) ;
1996-05-04 11:50:46 +04:00
}
2002-03-25 10:41:42 +03:00
/**
* Copy a string from a UCS2 src to a unix char * destination , allocating a buffer using talloc
*
* @ param dest always set at least to NULL
*
2003-02-24 06:09:08 +03:00
* @ returns The number of bytes occupied by the string in the destination
2002-03-25 10:41:42 +03:00
* */
2002-11-12 01:13:05 +03:00
2003-02-12 04:09:35 +03:00
size_t pull_ucs2_talloc ( TALLOC_CTX * ctx , char * * dest , const smb_ucs2_t * src )
2002-03-25 10:41:42 +03:00
{
2002-11-12 01:13:05 +03:00
size_t src_len = ( strlen_w ( src ) + 1 ) * sizeof ( smb_ucs2_t ) ;
2002-03-25 10:41:42 +03:00
* dest = NULL ;
2003-02-12 04:09:35 +03:00
return convert_string_talloc ( ctx , CH_UCS2 , CH_UNIX , src , src_len , ( void * * ) dest ) ;
2002-03-25 10:41:42 +03:00
}
/**
* Copy a string from a UCS2 src to a unix char * destination , allocating a buffer
*
* @ param dest always set at least to NULL
*
2003-02-24 06:09:08 +03:00
* @ returns The number of bytes occupied by the string in the destination
2002-03-25 10:41:42 +03:00
* */
2002-11-12 01:13:05 +03:00
size_t pull_ucs2_allocate ( void * * dest , const smb_ucs2_t * src )
2002-03-25 10:41:42 +03:00
{
2002-11-12 01:13:05 +03:00
size_t src_len = ( strlen_w ( src ) + 1 ) * sizeof ( smb_ucs2_t ) ;
2002-03-25 10:41:42 +03:00
* dest = NULL ;
return convert_string_allocate ( CH_UCS2 , CH_UNIX , src , src_len , dest ) ;
}
2002-03-23 11:39:04 +03:00
/**
* Copy a string from a UTF - 8 src to a unix char * destination , allocating a buffer using talloc
*
* @ param dest always set at least to NULL
*
2003-02-24 06:09:08 +03:00
* @ returns The number of bytes occupied by the string in the destination
2002-03-23 11:39:04 +03:00
* */
2002-11-12 01:13:05 +03:00
size_t pull_utf8_talloc ( TALLOC_CTX * ctx , char * * dest , const char * src )
2002-03-23 11:39:04 +03:00
{
2002-11-12 01:13:05 +03:00
size_t src_len = strlen ( src ) + 1 ;
2002-03-23 11:39:04 +03:00
* dest = NULL ;
2002-08-17 21:00:51 +04:00
return convert_string_talloc ( ctx , CH_UTF8 , CH_UNIX , src , src_len , ( void * * ) dest ) ;
2002-03-23 11:39:04 +03:00
}
/**
* Copy a string from a UTF - 8 src to a unix char * destination , allocating a buffer
*
* @ param dest always set at least to NULL
*
2003-02-24 06:09:08 +03:00
* @ returns The number of bytes occupied by the string in the destination
2002-03-23 11:39:04 +03:00
* */
2002-11-12 01:13:05 +03:00
size_t pull_utf8_allocate ( void * * dest , const char * src )
2002-03-23 11:39:04 +03:00
{
2002-11-12 01:13:05 +03:00
size_t src_len = strlen ( src ) + 1 ;
2002-03-23 11:39:04 +03:00
* dest = NULL ;
return convert_string_allocate ( CH_UTF8 , CH_UNIX , src , src_len , dest ) ;
}
2003-02-24 06:09:08 +03:00
/**
2002-11-12 01:13:05 +03:00
Copy a string from a char * src to a unicode or ascii
dos codepage destination choosing unicode or ascii based on the
flags in the SMB buffer starting at base_ptr .
Return the number of bytes occupied by the string in the destination .
flags can have :
STR_TERMINATE means include the null termination .
STR_UPPER means uppercase in the destination .
STR_ASCII use ascii even with unicode packet .
STR_NOALIGN means don ' t do alignment .
dest_len is the maximum length allowed in the destination . If dest_len
is - 1 then no maxiumum is used .
2003-02-24 06:09:08 +03:00
* */
2002-11-12 01:13:05 +03:00
2003-03-18 04:48:11 +03:00
size_t push_string_fn ( const char * function , unsigned int line , const void * base_ptr , void * dest , const char * src , size_t dest_len , int flags )
1996-05-04 11:50:46 +04:00
{
2003-03-18 04:48:11 +03:00
if ( dest_len ! = ( size_t ) - 1 )
clobber_region ( function , line , dest , dest_len ) ;
2001-07-04 11:15:53 +04:00
if ( ! ( flags & STR_ASCII ) & & \
( ( flags & STR_UNICODE | | \
( SVAL ( base_ptr , smb_flg2 ) & FLAGS2_UNICODE_STRINGS ) ) ) ) {
return push_ucs2 ( base_ptr , dest , src , dest_len , flags ) ;
}
return push_ascii ( dest , src , dest_len , flags ) ;
1996-05-04 11:50:46 +04:00
}
2003-02-24 06:09:08 +03:00
/**
2002-11-12 01:13:05 +03:00
Copy a string from a unicode or ascii source ( depending on
the packet flags ) to a char * destination .
Flags can have :
STR_TERMINATE means the string in src is null terminated .
STR_UNICODE means to force as unicode .
STR_ASCII use ascii even with unicode packet .
STR_NOALIGN means don ' t do alignment .
if STR_TERMINATE is set then src_len is ignored is it is - 1
src_len is the length of the source area in bytes .
Return the number of bytes occupied by the string in src .
The resulting string in " dest " is always null terminated .
2003-02-24 06:09:08 +03:00
* */
2002-11-12 01:13:05 +03:00
2003-03-18 04:48:11 +03:00
size_t pull_string_fn ( const char * function , unsigned int line , const void * base_ptr , char * dest , const void * src , size_t dest_len , size_t src_len , int flags )
2001-07-04 11:15:53 +04:00
{
2003-03-18 04:48:11 +03:00
if ( dest_len ! = ( size_t ) - 1 )
clobber_region ( function , line , dest , dest_len ) ;
2001-07-04 11:15:53 +04:00
if ( ! ( flags & STR_ASCII ) & & \
( ( flags & STR_UNICODE | | \
( SVAL ( base_ptr , smb_flg2 ) & FLAGS2_UNICODE_STRINGS ) ) ) ) {
return pull_ucs2 ( base_ptr , dest , src , dest_len , src_len , flags ) ;
}
return pull_ascii ( dest , src , dest_len , src_len , flags ) ;
}
2002-11-12 01:13:05 +03:00
size_t align_string ( const void * base_ptr , const char * p , int flags )
1996-05-04 11:50:46 +04:00
{
2001-07-04 11:15:53 +04:00
if ( ! ( flags & STR_ASCII ) & & \
( ( flags & STR_UNICODE | | \
( SVAL ( base_ptr , smb_flg2 ) & FLAGS2_UNICODE_STRINGS ) ) ) ) {
return ucs2_align ( base_ptr , p , flags ) ;
}
return 0 ;
1996-05-04 11:50:46 +04:00
}
2001-11-10 18:21:54 +03:00
2003-02-24 06:09:08 +03:00
/**
2002-11-12 01:13:05 +03:00
Convert from unix to ucs2 charset and return the
allocated and converted string or NULL if an error occurred .
You must provide a zero terminated string .
The returning string will be zero terminated .
2003-02-24 06:09:08 +03:00
* */
2002-11-12 01:13:05 +03:00
2001-11-10 18:21:54 +03:00
smb_ucs2_t * acnv_uxu2 ( const char * src )
{
size_t slen ;
size_t dlen ;
void * dest ;
slen = strlen ( src ) + 1 ;
dlen = convert_string_allocate ( CH_UNIX , CH_UCS2 , src , slen , & dest ) ;
2002-11-12 01:13:05 +03:00
if ( dlen = = ( size_t ) - 1 )
return NULL ;
else
return dest ;
2001-11-10 18:21:54 +03:00
}
2001-11-12 03:53:34 +03:00
2003-02-24 06:09:08 +03:00
/**
2002-11-12 01:13:05 +03:00
Convert from dos to ucs2 charset and return the
allocated and converted string or NULL if an error occurred .
You must provide a zero terminated string .
The returning string will be zero terminated .
2003-02-24 06:09:08 +03:00
* */
2002-11-12 01:13:05 +03:00
2001-11-12 03:53:34 +03:00
smb_ucs2_t * acnv_dosu2 ( const char * src )
{
size_t slen ;
size_t dlen ;
void * dest ;
slen = strlen ( src ) + 1 ;
dlen = convert_string_allocate ( CH_DOS , CH_UCS2 , src , slen , & dest ) ;
2002-11-12 01:13:05 +03:00
if ( dlen = = ( size_t ) - 1 )
return NULL ;
else
return dest ;
2001-11-12 03:53:34 +03:00
}