My favorites | Sign in
Project Home Downloads Wiki Issues Source
Checkout   Browse   Changes    
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
//
// $Id$
//

//
// Sphinx UDF (user-defined function) example
//
// Linux
// gcc -fPIC -shared -o udfexample.so udfexample.c
// CREATE FUNCTION sequence RETURNS INT SONAME 'udfexample.so';
// CREATE FUNCTION strtoint RETURNS INT SONAME 'udfexample.so';
// CREATE FUNCTION avgmva RETURNS FLOAT SONAME 'udfexample.so';
//
// Windows
// cl /MTd /LD udfexample.c
// CREATE FUNCTION sequence RETURNS INT SONAME 'udfexample.dll';
// CREATE FUNCTION strtoint RETURNS INT SONAME 'udfexample.dll';
// CREATE FUNCTION avgmva RETURNS FLOAT SONAME 'udfexample.dll';
//

#include "sphinxudf.h"
#include <stdio.h>
#include <string.h>
#include <stdlib.h>

#ifdef _MSC_VER
#define snprintf _snprintf
#define DLLEXPORT __declspec(dllexport)
#else
#define DLLEXPORT
#endif

/// SEQUENCE() initialization
/// gets called on every query, when query begins
/// args are filled with values for a particular query
///
/// accepts either no arguments or a single uint argument; on success,
/// allocates an int counter, sets it to 1, and stores it in init->func_data
/// returns 0 on success; on failure, writes a message to error_message
/// (at most SPH_UDF_ERROR_LEN bytes) and returns 1
DLLEXPORT int sequence_init ( SPH_UDF_INIT * init, SPH_UDF_ARGS * args, char * error_message )
{
	// stays NULL as long as no check has failed
	const char * failure = NULL;

	if ( args->arg_count > 1 )
	{
		// too many arguments
		failure = "SEQUENCE() takes either 0 or 1 arguments";
	} else if ( args->arg_count!=0 && args->arg_types[0]!=SPH_UDF_TYPE_UINT32 )
	{
		// the optional argument has a wrong type
		failure = "SEQUENCE() requires 1st argument to be uint";
	} else
	{
		// per-query counter storage; released in sequence_deinit()
		int * counter = malloc ( sizeof *counter );
		init->func_data = counter;

		if ( counter )
			*counter = 1;
		else
			failure = "malloc() failed";
	}

	if ( failure )
	{
		snprintf ( error_message, SPH_UDF_ERROR_LEN, "%s", failure );
		return 1;
	}

	// all done
	return 0;
}


/// SEQUENCE() deinitialization
/// gets called on every query, when query ends
/// releases the storage kept in init->func_data and resets the pointer
DLLEXPORT void sequence_deinit ( SPH_UDF_INIT * init )
{
	// free(NULL) is a no-op, so no guard is needed here
	free ( init->func_data );
	init->func_data = NULL;
}


/// SEQUENCE() implementation
/// gets called for every row, unless optimized away
///
/// returns the current value of the int counter kept in init->func_data
/// and then advances that counter by one; when an argument was passed,
/// its value (read as an int) is added to the returned number
DLLEXPORT sphinx_int64_t sequence ( SPH_UDF_INIT * init, SPH_UDF_ARGS * args, char * error_flag )
{
	int * counter = (int*) init->func_data;
	int value = *counter;

	// post-increment: the stored counter moves on, the old value is reported
	*counter = value + 1;

	if ( args->arg_count!=0 )
		value += *(int*) args->arg_values[0];

	return value;
}

//////////////////////////////////////////////////////////////////////////

/// STRTOINT() initialization
/// accepts exactly one argument, which must be a string
/// returns 0 on success; otherwise writes a message to error_message
/// (at most SPH_UDF_ERROR_LEN bytes) and returns 1
DLLEXPORT int strtoint_init ( SPH_UDF_INIT * init, SPH_UDF_ARGS * args, char * error_message )
{
	// the type is only inspected once the argument count is known to be 1
	if ( args->arg_count==1 && args->arg_types[0]==SPH_UDF_TYPE_STRING )
		return 0;

	snprintf ( error_message, SPH_UDF_ERROR_LEN, "STRTOINT() requires 1 string argument" );
	return 1;
}

/// STRTOINT() implementation
/// converts the leading run of ASCII decimal digits in the string argument
/// to a base-10 number; parsing stops at the first non-digit character or
/// once str_lengths[0] characters have been consumed
///
/// returns 0 when the string is empty or does not start with a digit
/// values too large for the result type are clamped to the largest
/// signed 64-bit value instead of overflowing
/// (assumes sphinx_int64_t is a signed 64-bit type, as its name suggests)
DLLEXPORT sphinx_int64_t strtoint ( SPH_UDF_INIT * init, SPH_UDF_ARGS * args, char * error_flag )
{
	// largest value a signed 64-bit integer can hold
	const sphinx_int64_t max_value = 9223372036854775807LL;

	const char * s = args->arg_values[0];
	int len = args->str_lengths[0];
	sphinx_int64_t res = 0;

	// len is checked first, so s is never dereferenced for an empty string
	while ( len>0 && *s>='0' && *s<='9' )
	{
		const int digit = *s - '0';

		// res*10 + digit would not fit; clamp rather than overflow (which is UB)
		if ( res > ( max_value - digit ) / 10 )
			return max_value;

		res = res*10 + digit;

		// move on to the next character
		s++;
		len--;
	}

	return res;
}

//////////////////////////////////////////////////////////////////////////

/// AVGMVA() initialization
/// accepts exactly one argument, which must be an MVA (either a uint32
/// set or a uint64 set)
/// returns 0 on success; otherwise writes a message to error_message
/// (at most SPH_UDF_ERROR_LEN bytes) and returns 1
///
/// on success, init->func_data is used as a plain flag rather than as a
/// pointer to storage: non-zero means 64-bit MVA, zero means 32-bit MVA
DLLEXPORT int avgmva_init ( SPH_UDF_INIT * init, SPH_UDF_ARGS * args, char * error_message )
{
	// the argument type is only inspected once the count is known to be 1
	int rejected = ( args->arg_count!=1 );
	if ( !rejected )
	{
		rejected = !( args->arg_types[0]==SPH_UDF_TYPE_UINT32SET
			|| args->arg_types[0]==SPH_UDF_TYPE_UINT64SET );
	}

	if ( rejected )
	{
		snprintf ( error_message, SPH_UDF_ERROR_LEN, "AVGMVA() requires 1 MVA argument" );
		return 1;
	}

	// store our mva vs mva64 flag to func_data
	if ( args->arg_types[0]==SPH_UDF_TYPE_UINT64SET )
		init->func_data = (void*)1;
	else
		init->func_data = NULL;

	return 0;
}

/// AVGMVA() implementation
/// returns the arithmetic mean of the values in the MVA argument
/// returns 0 when the argument pointer is NULL or the MVA holds no values
///
/// expects init->func_data to carry the flag stored by avgmva_init():
/// non-zero for a 64-bit MVA, zero for a 32-bit MVA
DLLEXPORT double avgmva ( SPH_UDF_INIT * init, SPH_UDF_ARGS * args, char * error_flag )
{
	unsigned int * mva = (unsigned int *) args->arg_values[0];
	double sum = 0;
	unsigned int i, n;

	if ( !mva )
		return 0;

	// Both MVA32 and MVA64 are stored as dword (unsigned 32-bit) arrays.
	// The first dword stores the array length (always in dwords too), and
	// the next ones store the values. In pseudocode:
	//
	// unsigned int num_dwords
	// unsigned int data [ num_dwords ]
	//
	// With MVA32, this lets you access the values pretty naturally.
	//
	// With MVA64, however, we have to do a few tricks:
	// a) divide num_dwords by 2 to get the number of 64-bit elements,
	// b) assemble those 64-bit values from dword pairs.
	//
	// The latter is required for architectures where non-aligned
	// 64-bit access crashes. On Intel, we could have also done it
	// like this:
	//
	// int * raw_ptr = (int*) args->arg_values[0];
	// int mva64_count = (*raw_ptr) / 2;
	// sphinx_uint64_t * mva64_values = (sphinx_uint64_t*)(raw_ptr + 1);

	// pull "mva32 or mva64" flag (that we stored in _init) from func_data;
	// compare the pointer itself instead of narrowing it to an int
	if ( init->func_data!=NULL )
	{
		// handle mva64: low dword comes first, high dword second
		n = *mva++ / 2;
		for ( i=0; i<n; i++ )
		{
			sum += (double)( (((sphinx_uint64_t)mva[1]) << 32) + mva[0] );
			mva += 2;
		}
	} else
	{
		// handle mva32
		n = *mva++;
		for ( i=0; i<n; i++ )
			sum += *mva++;
	}

	// an empty MVA has no average; avoid the 0/0 division
	if ( n==0 )
		return 0;

	return sum/n;
}

//
// $Id$
//

Change log

r3116 by klirichek on Feb 22, 2012   Diff
merged rel20 branch (upto r3115) back into
trunk
Go to: 
Project members, sign in to write a code review

Older revisions

r2681 by shodan on Feb 19, 2011   Diff
fixed eol-style

r2651 by shodan on Jan 27, 2011   Diff
added UDF support (plugin_dir
directive; CREATE/DROP FUNCTION
statements)

All revisions of this file

File info

Size: 4729 bytes, 185 lines

File properties

svn:eol-style
native
Powered by Google Project Hosting