1998b56c3Sdanielk1977 /*
2998b56c3Sdanielk1977 ** 2001 September 15
3998b56c3Sdanielk1977 **
4998b56c3Sdanielk1977 ** The author disclaims copyright to this source code. In place of
5998b56c3Sdanielk1977 ** a legal notice, here is a blessing:
6998b56c3Sdanielk1977 **
7998b56c3Sdanielk1977 ** May you do good and not evil.
8998b56c3Sdanielk1977 ** May you find forgiveness for yourself and forgive others.
9998b56c3Sdanielk1977 ** May you share freely, never taking more than you give.
10998b56c3Sdanielk1977 **
11998b56c3Sdanielk1977 *************************************************************************
12998b56c3Sdanielk1977 ** Code for testing the utf.c module in SQLite. This code
13998b56c3Sdanielk1977 ** is not included in the SQLite library. It is used for automated
14295ba55aSdanielk1977 ** testing of the SQLite library. Specifically, the code in this file
15295ba55aSdanielk1977 ** is used for testing the SQLite routines for converting between
16295ba55aSdanielk1977 ** the various supported unicode encodings.
17998b56c3Sdanielk1977 */
18998b56c3Sdanielk1977 #include "sqliteInt.h"
190202b29eSdanielk1977 #include "vdbeInt.h"
2052b1dbb5Smistachkin #if defined(INCLUDE_SQLITE_TCL_H)
2152b1dbb5Smistachkin # include "sqlite_tcl.h"
2252b1dbb5Smistachkin #else
23998b56c3Sdanielk1977 # include "tcl.h"
2452b1dbb5Smistachkin #endif
25998b56c3Sdanielk1977 #include <stdlib.h>
26998b56c3Sdanielk1977 #include <string.h>
27998b56c3Sdanielk1977
28998b56c3Sdanielk1977 /*
29295ba55aSdanielk1977 ** The first argument is a TCL UTF-8 string. Return the byte array
30295ba55aSdanielk1977 ** object with the encoded representation of the string, including
31295ba55aSdanielk1977 ** the NULL terminator.
32295ba55aSdanielk1977 */
binarize(void * clientData,Tcl_Interp * interp,int objc,Tcl_Obj * CONST objv[])33*7617e4a8Smistachkin static int SQLITE_TCLAPI binarize(
34295ba55aSdanielk1977 void * clientData,
35295ba55aSdanielk1977 Tcl_Interp *interp,
36295ba55aSdanielk1977 int objc,
37295ba55aSdanielk1977 Tcl_Obj *CONST objv[]
38295ba55aSdanielk1977 ){
39295ba55aSdanielk1977 int len;
40295ba55aSdanielk1977 char *bytes;
41295ba55aSdanielk1977 Tcl_Obj *pRet;
42295ba55aSdanielk1977 assert(objc==2);
43295ba55aSdanielk1977
44295ba55aSdanielk1977 bytes = Tcl_GetStringFromObj(objv[1], &len);
4503d847eaSdrh pRet = Tcl_NewByteArrayObj((u8*)bytes, len+1);
46295ba55aSdanielk1977 Tcl_SetObjResult(interp, pRet);
47295ba55aSdanielk1977 return TCL_OK;
48295ba55aSdanielk1977 }
49295ba55aSdanielk1977
500202b29eSdanielk1977 /*
510202b29eSdanielk1977 ** Usage: test_value_overhead <repeat-count> <do-calls>.
520202b29eSdanielk1977 **
530202b29eSdanielk1977 ** This routine is used to test the overhead of calls to
540202b29eSdanielk1977 ** sqlite3_value_text(), on a value that contains a UTF-8 string. The idea
550202b29eSdanielk1977 ** is to figure out whether or not it is a problem to use sqlite3_value
560202b29eSdanielk1977 ** structures with collation sequence functions.
570202b29eSdanielk1977 **
580202b29eSdanielk1977 ** If <do-calls> is 0, then the calls to sqlite3_value_text() are not
590202b29eSdanielk1977 ** actually made.
600202b29eSdanielk1977 */
test_value_overhead(void * clientData,Tcl_Interp * interp,int objc,Tcl_Obj * CONST objv[])61*7617e4a8Smistachkin static int SQLITE_TCLAPI test_value_overhead(
620202b29eSdanielk1977 void * clientData,
630202b29eSdanielk1977 Tcl_Interp *interp,
640202b29eSdanielk1977 int objc,
650202b29eSdanielk1977 Tcl_Obj *CONST objv[]
660202b29eSdanielk1977 ){
670202b29eSdanielk1977 int do_calls;
680202b29eSdanielk1977 int repeat_count;
690202b29eSdanielk1977 int i;
700202b29eSdanielk1977 Mem val;
710202b29eSdanielk1977
720202b29eSdanielk1977 if( objc!=3 ){
730202b29eSdanielk1977 Tcl_AppendResult(interp, "wrong # args: should be \"",
740202b29eSdanielk1977 Tcl_GetStringFromObj(objv[0], 0), " <repeat-count> <do-calls>", 0);
750202b29eSdanielk1977 return TCL_ERROR;
760202b29eSdanielk1977 }
770202b29eSdanielk1977
780202b29eSdanielk1977 if( Tcl_GetIntFromObj(interp, objv[1], &repeat_count) ) return TCL_ERROR;
790202b29eSdanielk1977 if( Tcl_GetIntFromObj(interp, objv[2], &do_calls) ) return TCL_ERROR;
800202b29eSdanielk1977
810202b29eSdanielk1977 val.flags = MEM_Str|MEM_Term|MEM_Static;
820202b29eSdanielk1977 val.z = "hello world";
83dc8453fdSdanielk1977 val.enc = SQLITE_UTF8;
840202b29eSdanielk1977
850202b29eSdanielk1977 for(i=0; i<repeat_count; i++){
860202b29eSdanielk1977 if( do_calls ){
87caffb1a5Sdrh sqlite3_value_text(&val);
880202b29eSdanielk1977 }
890202b29eSdanielk1977 }
900202b29eSdanielk1977
910202b29eSdanielk1977 return TCL_OK;
920202b29eSdanielk1977 }
930202b29eSdanielk1977
name_to_enc(Tcl_Interp * interp,Tcl_Obj * pObj)94bfd6cce5Sdanielk1977 static u8 name_to_enc(Tcl_Interp *interp, Tcl_Obj *pObj){
95bfd6cce5Sdanielk1977 struct EncName {
96bfd6cce5Sdanielk1977 char *zName;
97bfd6cce5Sdanielk1977 u8 enc;
98bfd6cce5Sdanielk1977 } encnames[] = {
99bfd6cce5Sdanielk1977 { "UTF8", SQLITE_UTF8 },
100bfd6cce5Sdanielk1977 { "UTF16LE", SQLITE_UTF16LE },
101bfd6cce5Sdanielk1977 { "UTF16BE", SQLITE_UTF16BE },
10244a376f6Sdanielk1977 { "UTF16", SQLITE_UTF16 },
103bfd6cce5Sdanielk1977 { 0, 0 }
104bfd6cce5Sdanielk1977 };
105bfd6cce5Sdanielk1977 struct EncName *pEnc;
106bfd6cce5Sdanielk1977 char *z = Tcl_GetString(pObj);
107bfd6cce5Sdanielk1977 for(pEnc=&encnames[0]; pEnc->zName; pEnc++){
108bfd6cce5Sdanielk1977 if( 0==sqlite3StrICmp(z, pEnc->zName) ){
109bfd6cce5Sdanielk1977 break;
110bfd6cce5Sdanielk1977 }
111bfd6cce5Sdanielk1977 }
112bfd6cce5Sdanielk1977 if( !pEnc->enc ){
113bfd6cce5Sdanielk1977 Tcl_AppendResult(interp, "No such encoding: ", z, 0);
114bfd6cce5Sdanielk1977 }
11544a376f6Sdanielk1977 if( pEnc->enc==SQLITE_UTF16 ){
11644a376f6Sdanielk1977 return SQLITE_UTF16NATIVE;
11744a376f6Sdanielk1977 }
118bfd6cce5Sdanielk1977 return pEnc->enc;
119bfd6cce5Sdanielk1977 }
120bfd6cce5Sdanielk1977
1211ba1b551Sdanielk1977 /*
1221ba1b551Sdanielk1977 ** Usage: test_translate <string/blob> <from enc> <to enc> ?<transient>?
1231ba1b551Sdanielk1977 **
1241ba1b551Sdanielk1977 */
test_translate(void * clientData,Tcl_Interp * interp,int objc,Tcl_Obj * CONST objv[])125*7617e4a8Smistachkin static int SQLITE_TCLAPI test_translate(
126bfd6cce5Sdanielk1977 void * clientData,
127bfd6cce5Sdanielk1977 Tcl_Interp *interp,
128bfd6cce5Sdanielk1977 int objc,
129bfd6cce5Sdanielk1977 Tcl_Obj *CONST objv[]
130bfd6cce5Sdanielk1977 ){
131bfd6cce5Sdanielk1977 u8 enc_from;
132bfd6cce5Sdanielk1977 u8 enc_to;
133bfd6cce5Sdanielk1977 sqlite3_value *pVal;
134bfd6cce5Sdanielk1977
1351ba1b551Sdanielk1977 char *z;
136bfd6cce5Sdanielk1977 int len;
1371ba1b551Sdanielk1977 void (*xDel)(void *p) = SQLITE_STATIC;
138bfd6cce5Sdanielk1977
1391ba1b551Sdanielk1977 if( objc!=4 && objc!=5 ){
140bfd6cce5Sdanielk1977 Tcl_AppendResult(interp, "wrong # args: should be \"",
141bfd6cce5Sdanielk1977 Tcl_GetStringFromObj(objv[0], 0),
142bfd6cce5Sdanielk1977 " <string/blob> <from enc> <to enc>", 0
143bfd6cce5Sdanielk1977 );
144bfd6cce5Sdanielk1977 return TCL_ERROR;
145bfd6cce5Sdanielk1977 }
1461ba1b551Sdanielk1977 if( objc==5 ){
1471e536953Sdanielk1977 xDel = sqlite3_free;
1481ba1b551Sdanielk1977 }
149bfd6cce5Sdanielk1977
150bfd6cce5Sdanielk1977 enc_from = name_to_enc(interp, objv[2]);
151bfd6cce5Sdanielk1977 if( !enc_from ) return TCL_ERROR;
152bfd6cce5Sdanielk1977 enc_to = name_to_enc(interp, objv[3]);
153bfd6cce5Sdanielk1977 if( !enc_to ) return TCL_ERROR;
154bfd6cce5Sdanielk1977
1551e536953Sdanielk1977 pVal = sqlite3ValueNew(0);
156bfd6cce5Sdanielk1977
157bfd6cce5Sdanielk1977 if( enc_from==SQLITE_UTF8 ){
158bfd6cce5Sdanielk1977 z = Tcl_GetString(objv[1]);
1591ba1b551Sdanielk1977 if( objc==5 ){
160b975598eSdrh z = sqlite3_mprintf("%s", z);
1611ba1b551Sdanielk1977 }
162b21c8cd4Sdrh sqlite3ValueSetStr(pVal, -1, z, enc_from, xDel);
163bfd6cce5Sdanielk1977 }else{
16403d847eaSdrh z = (char*)Tcl_GetByteArrayFromObj(objv[1], &len);
1651ba1b551Sdanielk1977 if( objc==5 ){
1661ba1b551Sdanielk1977 char *zTmp = z;
16717435752Sdrh z = sqlite3_malloc(len);
1681ba1b551Sdanielk1977 memcpy(z, zTmp, len);
1691ba1b551Sdanielk1977 }
170b21c8cd4Sdrh sqlite3ValueSetStr(pVal, -1, z, enc_from, xDel);
171bfd6cce5Sdanielk1977 }
172bfd6cce5Sdanielk1977
173b21c8cd4Sdrh z = (char *)sqlite3ValueText(pVal, enc_to);
174b21c8cd4Sdrh len = sqlite3ValueBytes(pVal, enc_to) + (enc_to==SQLITE_UTF8?1:2);
17503d847eaSdrh Tcl_SetObjResult(interp, Tcl_NewByteArrayObj((u8*)z, len));
176bfd6cce5Sdanielk1977
177bfd6cce5Sdanielk1977 sqlite3ValueFree(pVal);
178bfd6cce5Sdanielk1977
179bfd6cce5Sdanielk1977 return TCL_OK;
180bfd6cce5Sdanielk1977 }
181bfd6cce5Sdanielk1977
182bfd6cce5Sdanielk1977 /*
183bfd6cce5Sdanielk1977 ** Usage: translate_selftest
184bfd6cce5Sdanielk1977 **
185ee85813cSdrh ** Call sqlite3UtfSelfTest() to run the internal tests for unicode
186bfd6cce5Sdanielk1977 ** translation. If there is a problem an assert() will fail.
187bfd6cce5Sdanielk1977 **/
18844a376f6Sdanielk1977 void sqlite3UtfSelfTest(void);
test_translate_selftest(void * clientData,Tcl_Interp * interp,int objc,Tcl_Obj * CONST objv[])189*7617e4a8Smistachkin static int SQLITE_TCLAPI test_translate_selftest(
190bfd6cce5Sdanielk1977 void * clientData,
191bfd6cce5Sdanielk1977 Tcl_Interp *interp,
192bfd6cce5Sdanielk1977 int objc,
193bfd6cce5Sdanielk1977 Tcl_Obj *CONST objv[]
194bfd6cce5Sdanielk1977 ){
1956c62608fSdrh #ifndef SQLITE_OMIT_UTF16
196ee85813cSdrh sqlite3UtfSelfTest();
1976c62608fSdrh #endif
198bfd6cce5Sdanielk1977 return SQLITE_OK;
199bfd6cce5Sdanielk1977 }
200bfd6cce5Sdanielk1977
201998b56c3Sdanielk1977
202998b56c3Sdanielk1977 /*
203998b56c3Sdanielk1977 ** Register commands with the TCL interpreter.
204998b56c3Sdanielk1977 */
Sqlitetest5_Init(Tcl_Interp * interp)205998b56c3Sdanielk1977 int Sqlitetest5_Init(Tcl_Interp *interp){
206998b56c3Sdanielk1977 static struct {
207998b56c3Sdanielk1977 char *zName;
208295ba55aSdanielk1977 Tcl_ObjCmdProc *xProc;
209998b56c3Sdanielk1977 } aCmd[] = {
21024162fe6Sdanielk1977 { "binarize", (Tcl_ObjCmdProc*)binarize },
2110202b29eSdanielk1977 { "test_value_overhead", (Tcl_ObjCmdProc*)test_value_overhead },
212bfd6cce5Sdanielk1977 { "test_translate", (Tcl_ObjCmdProc*)test_translate },
213bfd6cce5Sdanielk1977 { "translate_selftest", (Tcl_ObjCmdProc*)test_translate_selftest},
214998b56c3Sdanielk1977 };
215998b56c3Sdanielk1977 int i;
216998b56c3Sdanielk1977 for(i=0; i<sizeof(aCmd)/sizeof(aCmd[0]); i++){
217295ba55aSdanielk1977 Tcl_CreateObjCommand(interp, aCmd[i].zName, aCmd[i].xProc, 0, 0);
218998b56c3Sdanielk1977 }
2190202b29eSdanielk1977 return SQLITE_OK;
220998b56c3Sdanielk1977 }
221