-
Notifications
You must be signed in to change notification settings - Fork 5
/
Copy pathicu_replace.c
154 lines (139 loc) · 4.35 KB
/
icu_replace.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
/*
** 2012 February 12
**
** The author disclaims copyright to this source code. In place of
** a legal notice, here is a blessing:
**
** May you do good and not evil.
** May you find forgiveness for yourself and forgive others.
** May you share freely, never taking more than you give.
**
*************************************************************************
** This file contains code for SQLite extension that uses icu to provide a regex_replace() function.
*/
#include <assert.h>
/* Include ICU headers */
#include <unicode/utypes.h>
#include <unicode/uregex.h>
#include <unicode/ustring.h>
#include <sqlite3ext.h>
SQLITE_EXTENSION_INIT1
/* stolen from icu standard extension */
static void xFree(void *p){
sqlite3_free(p);
}
/* stolen from icu standard extension */
static void icuFunctionError(
sqlite3_context *pCtx,
const char *zName,
UErrorCode e
){
char zBuf[128];
sqlite3_snprintf(128, zBuf, "ICU error: %s(): %s", zName, u_errorName(e));
zBuf[127] = '\0';
sqlite3_result_error(pCtx, zBuf, -1);
}
/* stolen from icu standard extension */
static void icuRegexpDelete(void *p){
URegularExpression *pExpr = (URegularExpression *)p;
uregex_close(pExpr);
}
static void icuReplaceAllFunc(
sqlite3_context *context,
int argc,
sqlite3_value **argv
){
UErrorCode status = U_ZERO_ERROR;
URegularExpression *pExpr;
const UChar *zInput; /* Pointer to input string */
UChar *zOutput = 0; /* Pointer to output buffer */
int nOut; /* Size of output buffer in bytes */
int cnt;
(void)argc; /* Unused parameter */
zInput = sqlite3_value_text16(argv[1]);
/* If the text is NULL, then the result is also NULL. */
if( !zInput ){
return;
}
const UChar *zReplacement = sqlite3_value_text16(argv[2]);
if ( !zReplacement ) {
sqlite3_result_error(context, "no replacement string", -1);
return;
}
pExpr = sqlite3_get_auxdata(context, 0);
if( !pExpr ){
const UChar *zPattern = sqlite3_value_text16(argv[0]);
if( !zPattern ){
return;
}
pExpr = uregex_open(zPattern, -1, 0, 0, &status);
if( U_SUCCESS(status) ){
sqlite3_set_auxdata(context, 0, pExpr, icuRegexpDelete);
}else{
assert(!pExpr);
icuFunctionError(context, "uregex_open", status);
return;
}
}
/* Configure the text that the regular expression operates on. */
uregex_setText(pExpr, zInput, -1, &status);
if( !U_SUCCESS(status) ){
icuFunctionError(context, "uregex_setText", status);
return;
}
/* Expect output length = input length. */
nOut = sqlite3_value_bytes16(argv[1]);
if( nOut==0 ){ // or output length = replacement length
nOut = sqlite3_value_bytes16(argv[2]);
}
if( nOut==0 ){ // if both input and replacement are empty
sqlite3_result_text16(context, "", 0, SQLITE_STATIC);
return;
}
/*
int32_t uregex_replaceAll (URegularExpression *regexp, const UChar *replacementText, int32_t replacementLength, UChar *destBuf, int32_t destCapacity, UErrorCode *status)
*/
for(cnt=0; cnt<2; cnt++){
UChar *zNew = sqlite3_realloc(zOutput, nOut);
if( zNew==0 ){
sqlite3_free(zOutput);
sqlite3_result_error_nomem(context);
return;
}
zOutput = zNew;
status = U_ZERO_ERROR;
/* Attempt the replace */
nOut = 2*uregex_replaceAll(pExpr, zReplacement, -1, zOutput, nOut/2, &status);
if( status==U_BUFFER_OVERFLOW_ERROR ){
assert( cnt==0 );
continue;
}
break;
}
if( !U_SUCCESS(status) ){
sqlite3_free(zOutput);
icuFunctionError(context, "uregex_replaceAll", status);
return;
}
/* Set the text that the regular expression operates on to a NULL
** pointer. This is not really necessary, but it is tidier than
** leaving the regular expression object configured with an invalid
** pointer after this function returns.
*/
uregex_setText(pExpr, 0, 0, &status);
sqlite3_result_text16(context, zOutput, nOut, xFree);
}
/* SQLite invokes this routine once when it loads the extension.
** Create new functions, collating sequences, and virtual table
** modules here. This is usually the only exported symbol in
** the shared library.
*/
int sqlite3_extension_init(
sqlite3 *db,
char **pzErrMsg,
const sqlite3_api_routines *pApi
){
SQLITE_EXTENSION_INIT2(pApi)
sqlite3_create_function_v2(db, "regex_replace", 3, SQLITE_ANY, 0, icuReplaceAllFunc, NULL, NULL, NULL);
return 0;
}