[925] | 1 | #include "mex.h" |
| 2 | |
| 3 | /* |
| 4 | * $Id: xml_findstr.c 6480 2015-06-13 01:08:30Z guillaume $ |
| 5 | * Guillaume Flandin <guillaume@artefact.tk> |
| 6 | */ |
| 7 | |
| 8 | /* |
| 9 | Differences with built-in findstr: |
| 10 | - allows searching for only the first n occurrences of a pattern |
| 11 | - allows searching only in a substring (given the index of its beginning) |
| 12 | |
| 13 | MATLAB hack: |
| 14 | - doesn't use mxGetString to prevent a copy of the string. |
| 15 | - assumes MATLAB stores strings as unsigned short (Unicode 16 bits) |
| 16 | matrix.h: typedef uint16_T mxChar; |
| 17 | (that's the case for MATLAB 5.*, 6.* and 7.* but MATLAB 4.* stores |
| 18 | strings as double and GNU Octave as char, see src/mxarray.h) |
| 19 | */ |
| 20 | |
| 21 | /* Comment the following line to use standard mxGetString (slower). When __HACK_MXCHAR__ is defined (which happens whenever HAVE_OCTAVE is not defined), mexFunction reads the character data of its inputs in place through mxGetData as unsigned short units; otherwise it copies each input into a char buffer with mxGetString. */ |
| 22 | #if !defined (HAVE_OCTAVE) |
| 23 | #define __HACK_MXCHAR__ |
| 24 | #endif |
| 25 | |
| 26 | void mexFunction(int nlhs, mxArray *plhs[], int nrhs, const mxArray *prhs[]) { |
| 27 | |
| 28 | unsigned int i, j, stext, spattern, nbmatch = 0, ind = 1, occur = 0, nboccur = 0; |
| 29 | #ifdef __HACK_MXCHAR__ |
| 30 | unsigned short int *text = NULL, *pattern = NULL; |
| 31 | #else |
| 32 | char *text = NULL, *pattern = NULL; |
| 33 | #endif |
| 34 | unsigned int *k = NULL; |
| 35 | mxArray *out = NULL; |
| 36 | |
| 37 | /* Check for proper number of arguments. */ |
| 38 | if ((nrhs == 0) || (nrhs == 1)) |
| 39 | mexErrMsgTxt("Not enough input arguments."); |
| 40 | else if (nrhs > 4) |
| 41 | mexErrMsgTxt("Too many input arguments."); |
| 42 | else if (nlhs > 1) |
| 43 | mexErrMsgTxt("Too many output arguments."); |
| 44 | |
| 45 | /* The input TEXT must be a string */ |
| 46 | if (!mxIsChar(prhs[0])) |
| 47 | mexErrMsgTxt("Inputs must be character arrays."); |
| 48 | stext = mxGetM(prhs[0]) * mxGetN(prhs[0]); |
| 49 | #ifdef __HACK_MXCHAR__ |
| 50 | text = mxGetData(prhs[0]); |
| 51 | #else |
| 52 | text = mxCalloc(stext+1, sizeof(char)); |
| 53 | mxGetString(prhs[0], text, stext+1); |
| 54 | #endif |
| 55 | |
| 56 | /* The input PATTERN must be a string */ |
| 57 | if (!mxIsChar(prhs[1])) |
| 58 | mexErrMsgTxt("Inputs must be character arrays."); |
| 59 | spattern = mxGetM(prhs[1]) * mxGetN(prhs[1]); |
| 60 | #ifdef __HACK_MXCHAR__ |
| 61 | pattern = mxGetData(prhs[1]); |
| 62 | #else |
| 63 | pattern = mxCalloc(spattern+1, sizeof(char)); |
| 64 | mxGetString(prhs[1], pattern, spattern+1); |
| 65 | #endif |
| 66 | |
| 67 | /* The input INDEX must be an integer */ |
| 68 | if (nrhs > 2) { |
| 69 | if ((!mxIsNumeric(prhs[2]) || (mxGetM(prhs[2]) * mxGetN(prhs[2]) != 1))) |
| 70 | mexErrMsgTxt("Index input must be an integer."); |
| 71 | ind = (unsigned int)mxGetScalar(prhs[2]); |
| 72 | if (ind < 1) |
| 73 | mexErrMsgTxt("Index must be greater than 1."); |
| 74 | } |
| 75 | |
| 76 | /* The input OCCUR must be an integer */ |
| 77 | if (nrhs == 4) { |
| 78 | if ((!mxIsNumeric(prhs[3]) || (mxGetM(prhs[3]) * mxGetN(prhs[3]) != 1))) |
| 79 | mexErrMsgTxt("Index input must be an integer."); |
| 80 | nboccur = (unsigned int)mxGetScalar(prhs[3]); |
| 81 | } |
| 82 | |
| 83 | /* Find pattern in text */ |
| 84 | for (i=ind-1;i<stext;i++) { |
| 85 | for (j=0;j<spattern && i+j<stext;j++) { |
| 86 | if (pattern[j] == text[i+j]) { |
| 87 | if (j == spattern-1) { |
| 88 | nbmatch += 1; |
| 89 | k = mxRealloc(k,nbmatch*sizeof(unsigned int)); |
| 90 | k[nbmatch-1] = i+1; |
| 91 | if (++occur == nboccur) i = stext; |
| 92 | } |
| 93 | } |
| 94 | else break; |
| 95 | } |
| 96 | } |
| 97 | |
| 98 | /* Allocate output */ |
| 99 | out = mxCreateDoubleMatrix((nbmatch) ? 1:0, nbmatch, mxREAL); |
| 100 | |
| 101 | /* Copy index array into output */ |
| 102 | for (i=0;i<nbmatch;i++) |
| 103 | mxGetPr(out)[i] = (double)k[i]; |
| 104 | |
| 105 | /* Assign pointer to output */ |
| 106 | plhs[0] = out; |
| 107 | |
| 108 | /* Free memory */ |
| 109 | if (k) mxFree(k); |
| 110 | } |
