19 Star 33 Fork 26

openLooKeng / hetu-odbc-driver

加入 Gitee
与超过 1200万 开发者一起发现、参与优秀开源项目,私有仓库也完全免费 :)
免费加入
克隆/下载
ma_parse.c 15.13 KB
一键复制 编辑 原始数据 按行查看 历史
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568
/************************************************************************************
Copyright (C) 2013,2018 MariaDB Corporation AB
Copyright (C) 2018-2020. Huawei Technologies Co., Ltd. All rights reserved.
This library is free software; you can redistribute it and/or
modify it under the terms of the GNU Library General Public
License as published by the Free Software Foundation; either
version 2.1 of the License, or (at your option) any later version.
This library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
Library General Public License for more details.
You should have received a copy of the GNU Library General Public
License along with this library; if not see <http://www.gnu.org/licenses>
or write to the Free Software Foundation, Inc.,
51 Franklin St., Fifth Floor, Boston, MA 02110, USA
*************************************************************************************/
#include <ma_odbc.h>
/* Length threshold for the reduced ("poor man") parsing mode: ShouldWeTryPoorManParsing() only
   considers a query whose RefinedLength is greater than this value */
#define QUERY_LEN_FOR_POOR_MAN_PARSING 32768
/* Moves *CurPtr forward past leading comments and whitespace.

   Each pass strips one leading comment (StripLeadingComments) and then leading whitespace (ltrim).
   Passes repeat until the position stops changing or reaches the end, where the end is computed
   once from the initial *CurPtr + *Length.

   CurPtr    - in/out: current position in the query text
   Length    - in/out: remaining length; after every pass it is reset to strlen() of the new position
   OverWrite - forwarded to StripLeadingComments

   Returns the updated *CurPtr. */
char* SkipSpacesAndComments(char **CurPtr, size_t *Length, BOOL OverWrite)
{
  char *const Limit= *CurPtr + *Length;
  char *Seen= NULL;

  for (;;)
  {
    char *Cur= *CurPtr;

    /* Stop at the end of the text, or when the previous pass did not move us */
    if (Cur >= Limit || Cur == Seen)
    {
      break;
    }
    Seen= Cur;

    Cur= StripLeadingComments(Cur, Length, OverWrite);
    Cur= ltrim(Cur);

    *CurPtr= Cur;
    *Length= strlen(Cur);
  }

  return *CurPtr;
}
/* Advances *CurPtr to the next unescaped Quote character, or to End if there is none.

   A backslash makes the scan skip the character that follows it, so an escaped quote does not
   terminate the scan. A backslash in the very last position stops the scan at End.

   CurPtr - in/out: position to start scanning from; updated to where the scan stopped
   End    - one past the last character that may be examined
   Quote  - the closing quote character to look for

   Returns the updated *CurPtr. */
char* SkipQuotedString(char **CurPtr, char *End, char Quote)
{
  char *Cursor= *CurPtr;

  for (; Cursor < End && *Cursor != Quote; ++Cursor)
  {
    if (*Cursor != '\\')
    {
      continue;
    }
    /* Step over the backslash; the loop increment then steps over the escaped character */
    ++Cursor;
    if (Cursor == End)
    {
      /* Backslash was the last character - nothing left to skip */
      break;
    }
  }

  *CurPtr= Cursor;
  return Cursor;
}
/* Advances *CurPtr to the next Quote character, or to End if there is none.
   Unlike SkipQuotedString, a backslash has no special meaning here.

   CurPtr - in/out: position to start scanning from; updated to where the scan stopped
   End    - one past the last character that may be examined
   Quote  - the closing quote character to look for

   Returns the updated *CurPtr. */
char* SkipQuotedString_Noescapes(char **CurPtr, char *End, char Quote)
{
  char *Cursor;

  for (Cursor= *CurPtr; Cursor < End; ++Cursor)
  {
    if (*Cursor == Quote)
    {
      break;
    }
  }

  *CurPtr= Cursor;
  return Cursor;
}
/* Discards the statement's current parsed query and, if a new text is supplied, installs a private
   copy of it together with the connection-dependent parsing options.

   Stmt           - statement whose Query member is reset
   OriginalQuery  - new query text; may be NULL, in which case the query is only cleared.
                    It does not have to be NUL-terminated
   OriginalLength - number of meaningful characters in OriginalQuery

   Returns 0 on success and 1 if the copy of the text could not be allocated. */
int MADB_ResetParser(MADB_Stmt *Stmt, char *OriginalQuery, SQLINTEGER OriginalLength)
{
  char *Copy;

  MADB_DeleteQuery(&Stmt->Query);

  if (OriginalQuery == NULL)
  {
    return 0;
  }

  /* The source is not guaranteed to be NUL-terminated: strndup copies the meaningful characters
     and appends the terminator. RefinedText may move later on, allocated keeps pointing at the
     start of the allocation */
  Copy= strndup(OriginalQuery, OriginalLength);
  Stmt->Query.RefinedText= Copy;
  Stmt->Query.allocated= Copy;

  if (Copy == NULL)
  {
    return 1;
  }

  Stmt->Query.RefinedLength= OriginalLength;
  Stmt->Query.BatchAllowed= DSN_OPTION(Stmt->Connection, MADB_OPT_FLAG_MULTI_STATEMENTS) ? '\1' : '\0';
  Stmt->Query.AnsiQuotes= MADB_SqlMode(Stmt->Connection, MADB_ANSI_QUOTES);
  Stmt->Query.NoBackslashEscape= MADB_SqlMode(Stmt->Connection, MADB_NO_BACKSLASH_ESCAPES);

  return 0;
}
/* Releases the parameter-position array of every sub-query stored in Query->SubQuery and then the
   SubQuery array itself. Each element is copied into a local before its ParamPos is released. */
void MADB_DeleteSubqueries(MADB_QUERY * Query)
{
  SINGLE_QUERY Current;
  unsigned int Idx= 0;

  while (Idx < Query->SubQuery.elements)
  {
    MADB_GetDynamic(&Query->SubQuery, (char *)&Current, Idx);
    MADB_DeleteDynamic(&Current.ParamPos);
    ++Idx;
  }

  MADB_DeleteDynamic(&Query->SubQuery);
}
/* Appends a sub-query record to Query->SubQuery.

   Query        - query the record is added to
   SubQueryText - stored as is in the record (the pointer, not a copy of the text)
   QueryType    - type of the sub-query

   The record gets its own, freshly initialized ParamPos array of unsigned int elements. */
void MADB_AddSubQuery(MADB_QUERY * Query, char * SubQueryText, enum enum_madb_query_type QueryType)
{
  SINGLE_QUERY Entry;

  MADB_InitDynamicArray(&Entry.ParamPos, sizeof(unsigned int), 20, 20);
  Entry.QueryType= QueryType;
  Entry.QueryText= SubQueryText;

  MADB_InsertDynamic(&Query->SubQuery, (char*)&Entry);
}
/* Releases everything owned by Query (sub-queries, token array, the "original" copy and the
   allocated text buffer) and zeroes the whole structure, leaving it ready for reuse. */
void MADB_DeleteQuery(MADB_QUERY *Query)
{
  /* Dynamic arrays first ... */
  MADB_DeleteSubqueries(Query);
  MADB_DeleteDynamic(&Query->Tokens);

  /* ... then the two text buffers */
  MADB_FREE(Query->Original);
  MADB_FREE(Query->allocated);

  memset(Query, 0, sizeof(*Query));
}
/* Prepares the query text installed by MADB_ResetParser and runs the parser on it.

   Steps: trim the end (SqlRtrim) and the beginning (ltrim) of the text, unwrap a surrounding
   {...} via FixIsoFormat, store a copy of the result in Query->Original, skip leading
   spaces/comments and finally tokenize with ParseQuery.

   Returns 1 if the copy for Query->Original could not be allocated (same convention as
   MADB_ResetParser), otherwise the result of ParseQuery. */
int MADB_ParseQuery(MADB_QUERY * Query)
{
  /* make sure we don't have trailing whitespace or semicolon */
  Query->RefinedLength= SqlRtrim(Query->RefinedText, (int)Query->RefinedLength);
  Query->RefinedText= ltrim(Query->RefinedText);

  /* NOTE(review): RefinedLength is still counted from Query->allocated at this point, i.e. it is
     not yet reduced by what ltrim skipped, while FixIsoFormat indexes with it from the new
     RefinedText; and FixIsoFormat may itself replace the length with strlen() of its result
     before the offset is subtracted below. The two steps look tightly coupled - confirm the
     arithmetic for inputs with leading whitespace and/or braces before touching either one */
  Query->RefinedText= FixIsoFormat(Query->RefinedText, &Query->RefinedLength);
  Query->RefinedLength-= Query->RefinedText - Query->allocated;

  /* Making copy of "original" string, with minimal changes required to be able to execute */
  Query->Original= strndup(Query->RefinedText, Query->RefinedLength);
  if (Query->Original == NULL)
  {
    /* Out of memory - do not continue with a query that has no Original text */
    return 1;
  }

  SkipSpacesAndComments(&Query->RefinedText, &Query->RefinedLength, FALSE);

  return ParseQuery(Query);
}
/*----------------- Tokens stuff ------------------*/
/* Returns a pointer to the beginning of the token number Idx inside Query->RefinedText.

   Token positions are stored in Query->Tokens as unsigned int offsets from RefinedText. The
   returned pointer is not a separate string - it points into the query text, which continues
   after the token.

   Returns NULL if there is no query text, no tokens, or Idx is out of range. */
char *MADB_Token(MADB_QUERY *Query, unsigned int Idx)
{
  unsigned int TokenOffset= 0;
  char *Text= Query->RefinedText;

  if (Text == NULL || Query->Tokens.elements == 0 || Idx >= Query->Tokens.elements)
  {
    return NULL;
  }

  MADB_GetDynamic(&Query->Tokens, (char *)&TokenOffset, Idx);

  return Query->RefinedText + TokenOffset;
}
/* Checks whether the token number Idx begins with the string Compare.

   Only the first Length characters are compared (with _strnicmp), so a longer token that merely
   starts with Compare matches as well.

   Query   - parsed query
   Idx     - token index
   Compare - text to compare the token with
   Length  - number of characters to compare
   Offset  - optional (may be NULL); on a match receives the offset of the token from
             Query->RefinedText. It is left untouched if there is no match

   Returns TRUE on match, FALSE otherwise, including the case when the token does not exist. */
my_bool MADB_CompareToken(MADB_QUERY *Query, unsigned int Idx, char *Compare, size_t Length, unsigned int *Offset)
{
  char *Candidate= MADB_Token(Query, Idx);

  if (Candidate == NULL || _strnicmp(Candidate, Compare, Length) != 0)
  {
    return FALSE;
  }

  if (Offset != NULL)
  {
    *Offset= (unsigned int)(Candidate - Query->RefinedText);
  }

  return TRUE;
}
/* Not used atm, but may be useful.

   Looks for the first token that begins with Compare (see MADB_CompareToken) and returns its
   offset from Query->RefinedText.

   Returns 0 if no token matches. Note that 0 is also the offset of a token sitting at the very
   beginning of the text, so the two cases cannot be told apart by the return value alone. */
unsigned int MADB_FindToken(MADB_QUERY *Query, char *Compare)
{
  unsigned int i, TokenCount= Query->Tokens.elements;
  unsigned int Offset= 0;
  size_t CompareLength;

  /* Nothing to search in; Compare is deliberately not touched in this case */
  if (TokenCount == 0)
  {
    return 0;
  }

  /* The length does not change between iterations - computing it once */
  CompareLength= strlen(Compare);

  for (i= 0; i < TokenCount; i++)
  {
    if (MADB_CompareToken(Query, i, Compare, CompareLength, &Offset))
    {
      return Offset;
    }
  }

  return 0;
}
/* Searches the token list for the sequence WHERE CURRENT OF <name>.

   Query  - parsed query (tokens have to be available)
   Offset - passed to the WHERE comparison; on success holds the offset of that WHERE token from
            Query->RefinedText. It may also have been written for an earlier WHERE token that was
            not followed by CURRENT OF, even if NULL is returned in the end

   Returns pointer to the token following OF (the cursor name) inside the query text, or NULL if
   the sequence has not been found or there are fewer than 4 tokens. */
static char * ParseCursorName(MADB_QUERY *Query, unsigned int *Offset)
{
  const unsigned int Total= Query->Tokens.elements;
  unsigned int First;

  if (Total < 4)
  {
    return NULL;
  }

  /* First is the candidate position of WHERE; 3 more tokens have to follow it */
  for (First= 0; First < Total - 3; ++First)
  {
    if (!MADB_CompareToken(Query, First, "WHERE", 5, Offset))
    {
      continue;
    }
    if (!MADB_CompareToken(Query, First + 1, "CURRENT", 7, 0))
    {
      continue;
    }
    if (!MADB_CompareToken(Query, First + 2, "OF", 2, 0))
    {
      continue;
    }
    return MADB_Token(Query, First + 3);
  }

  return NULL;
}
/* Cursor name lookup for queries that went through "poor man" parsing and thus have no complete
   token list.

   Only the tail of the query is tokenized: a temporary MADB_QUERY is pointed at the last
   MADB_MAX_CURSOR_NAME + 32 characters of the text (32 is for "WHERE CURRENT OF" + spaces) and
   parsed the usual way. The temporary query does not own the text - it is a window into
   Query->RefinedText, so the returned pointer stays valid after the temporary query is deleted.
   ParseQuery skips comments with overwriting enabled, so comments inside that window may get
   blanked in the caller's text.

   Query  - the (long) query to look at
   Offset - on success receives the offset of the WHERE token from Query->RefinedText

   Returns pointer to the cursor name inside Query->RefinedText, or NULL if there is no
   WHERE CURRENT OF at the end of the query or the tail could not be parsed. */
static char * PoorManCursorName(MADB_QUERY *Query, unsigned int *Offset)
{
  MADB_QUERY EndPiece;
  char *Res= NULL;

  memset(&EndPiece, 0, sizeof(MADB_QUERY));

  /* We do poor man on long queries only, thus there is no need to check length */
  EndPiece.RefinedText= ltrim(Query->RefinedText + Query->RefinedLength - MADB_MAX_CURSOR_NAME - 32/* "WHERE CURRENT OF" + spaces */);
  EndPiece.RefinedLength= strlen(EndPiece.RefinedText);

  /* As we did poor man parsing, we don't have full information about the query. Thus, parsing only this part at the end of the query -
     we need tokens, to check if we have WHERE CURRENT OF in usual way */
  if (ParseQuery(&EndPiece) == 0)
  {
    /* Now looking for cursor name in usual way */
    Res= ParseCursorName(&EndPiece, Offset);

    /* Incrementing Offset with the offset of our part of the query */
    if (Res != NULL)
    {
      *Offset= (unsigned int)(*Offset + EndPiece.RefinedText - Query->RefinedText);
    }
  }

  /* Single exit: the arrays ParseQuery has initialized are released on the failure path, too */
  MADB_DeleteQuery(&EndPiece);

  return Res;
}
/* Returns the cursor name of a WHERE CURRENT OF <name> clause, or NULL if there is none.
   Picks the lookup that matches the way the query has been parsed: the tail-only lookup for
   queries flagged with PoorManParsing, and the regular token based one otherwise.
   Offset is handed over to the chosen lookup. */
char * MADB_ParseCursorName(MADB_QUERY *Query, unsigned int *Offset)
{
  return Query->PoorManParsing ? PoorManCursorName(Query, Offset)
                               : ParseCursorName(Query, Offset);
}
/* Determines the statement type from its first two tokens.

   Token1 - beginning of the 1st token. Leading non-alphabetic characters are skipped first
   Token2 - beginning of the 2nd token. It is only looked at if the 1st one is CREATE, SET or BEGIN

   Keywords are compared with _strnicmp over the keyword's length only, so anything that begins
   with a keyword matches it (e.g. the 4 character check for DESC also covers DESCRIBE).

   Returns the matching enum_madb_query_type value; MADB_QUERY_NO_RESULT if nothing matched,
   including CREATE followed by anything other than PROCEDURE, FUNCTION or DEFINER. */
enum enum_madb_query_type MADB_GetQueryType(const char *Token1, const char *Token2)
{
  /* We need for the case when MS Access adds parenthesis around query - see ODBC-57.
     The cast is required: passing a negative char value (bytes >= 0x80 where char is signed)
     to isalpha is undefined behavior */
  while (*Token1 && !isalpha((unsigned char)*Token1))
  {
    ++Token1;
  }

  if (_strnicmp(Token1, "SELECT", 6) == 0 || _strnicmp(Token1, "WITH", 4) == 0)
  {
    return MADB_QUERY_SELECT;
  }
  if (_strnicmp(Token1, "INSERT", 6) == 0 || _strnicmp(Token1, "REPLACE", 7) == 0)
  {
    return MADB_QUERY_INSERT;
  }
  if (_strnicmp(Token1, "UPDATE", 6) == 0)
  {
    return MADB_QUERY_UPDATE;
  }
  if (_strnicmp(Token1, "DELETE", 6) == 0)
  {
    return MADB_QUERY_DELETE;
  }
  if (_strnicmp(Token1, "CALL", 4) == 0)
  {
    return MADB_QUERY_CALL;
  }
  if (_strnicmp(Token1, "SHOW", 4) == 0)
  {
    return MADB_QUERY_SHOW;
  }
  if (_strnicmp(Token1, "ANALYZE", 7) == 0)
  {
    return MADB_QUERY_ANALYZE;
  }
  if (_strnicmp(Token1, "EXPLAIN", 7) == 0)
  {
    return MADB_QUERY_EXPLAIN;
  }
  if (_strnicmp(Token1, "CHECK", 5) == 0)
  {
    return MADB_QUERY_CHECK;
  }
  if (_strnicmp(Token1, "EXECUTE", 7) == 0)
  {
    return MADB_QUERY_EXECUTE;
  }

  /* For CREATE the type depends on what is being created */
  if (_strnicmp(Token1, "CREATE", 6) == 0)
  {
    if (_strnicmp(Token2, "PROCEDURE", 9) == 0)
    {
      return MADB_QUERY_CREATE_PROC;
    }
    if (_strnicmp(Token2, "FUNCTION", 8) == 0)
    {
      return MADB_QUERY_CREATE_FUNC;
    }
    if (_strnicmp(Token2, "DEFINER", 7) == 0)
    {
      return MADB_QUERY_CREATE_DEFINER;
    }
    /* Any other CREATE ends up as MADB_QUERY_NO_RESULT below */
  }

  /* SET NAMES has its own type */
  if (_strnicmp(Token1, "SET", 3) == 0)
  {
    if (_strnicmp(Token2, "NAMES", 5) == 0)
    {
      return MADB_QUERY_SET_NAMES;
    }
    else
    {
      return MADB_QUERY_SET;
    }
  }
  if (_strnicmp(Token1, "DESC", 4) == 0)
  {
    return MADB_QUERY_DESCRIBE;
  }
  if (_strnicmp(Token1, "PREPARE", strlen("PREPARE")) == 0)
  {
    return MADB_QUERY_PREPARE;
  }
  if (_strnicmp(Token1, "BEGIN", 5) == 0 && _strnicmp(Token2, "NOT", 3) == 0)
  {
    return MADB_NOT_ATOMIC_BLOCK;
  }

  return MADB_QUERY_NO_RESULT;
}
/* -------------------- Tokens - End ----------------- */
/* Not used - rather a placeholder in case we need it.
   Currently it does no searching at all and simply returns what STMT_STRING yields for the
   statement. */
const char * MADB_FindParamPlaceholder(MADB_Stmt *Stmt)
{
  const char *StmtText= STMT_STRING(Stmt);

  return StmtText;
}
/* Unwraps a statement enclosed in curly braces, i.e. {...}.
   Function assumes that query string has been trimmed.

   StmtString - statement text; it is modified in place if it is enclosed in braces
   Length     - in/out: length of StmtString. Only changed if braces were found - it is then
                set to strlen() of the returned string

   Returns pointer to the text inside of the braces after trim(), or StmtString itself if the
   text does not begin with '{' and end with '}' (judged by the character at *Length - 1). */
char* FixIsoFormat(char * StmtString, size_t *Length)
{
if (*Length > 0 && StmtString[0] == '{' && StmtString[*Length -1] == '}')
{
char *Res;
/* Stepping over the opening brace */
++StmtString;
/* NOTE(review): the pointer has already been advanced, so index *Length - 1 is now one position
   further than the '}' tested above. If *Length is the exact string length, this writes over
   the existing terminator and the closing brace stays in the string - TODO confirm. The caller
   (MADB_ParseQuery) subtracts the pointer shift from the length after this call, which may be
   compensating for it; do not change one without the other */
StmtString[*Length - 1]= '\0';
Res= trim(StmtString);
*Length= strlen(Res);
return Res;
}
return StmtString;
}
/* Appends the position of a token to Query->Tokens. The position is stored as unsigned int
   offset of PTR2SAVE from Query->RefinedText.
   The macro relies on the names Query and Offset (an unsigned int variable) being available at
   the place of use. The argument is parenthesized so that an expression can be passed safely. */
#define SAVE_TOKEN(PTR2SAVE) do { Offset= (unsigned int)((PTR2SAVE) - Query->RefinedText);\
  MADB_InsertDynamic(&Query->Tokens, (char*)&Offset); } while(0)
/* Tells whether the query qualifies for the reduced ("poor man") parsing: it has to be longer
   than QUERY_LEN_FOR_POOR_MAN_PARSING and contain neither ';' nor '?' anywhere in the text
   (the characters are searched for in the raw text, i.e. inside of strings and comments, too). */
static BOOL ShouldWeTryPoorManParsing(MADB_QUERY *Query)
{
  /* Short queries are always parsed in full */
  if (Query->RefinedLength <= QUERY_LEN_FOR_POOR_MAN_PARSING)
  {
    return FALSE;
  }
  /* Possible multi-statement */
  if (strchr(Query->RefinedText, ';') != NULL)
  {
    return FALSE;
  }
  /* Possible parameter placeholder */
  return strchr(Query->RefinedText, '?') == NULL;
}
/* Tokenizes Query->RefinedText (Query->RefinedLength characters of it).

   Results are stored in the Query structure:
   - Tokens        - offsets (unsigned int, from RefinedText) of the beginning of each token
   - SubQuery      - one record per statement for which a 2nd token has been seen; its type is
                     derived from the statement's first two tokens
   - QueryType     - type of the first statement
   - ReturnsResult - set if any of the statements is of a type that may return a result
   - HasParameters - set if a '?' is met outside of quoted strings, unless QueryType is
                     MADB_QUERY_PREPARE
   - PoorManParsing- result of ShouldWeTryPoorManParsing(); if set, parsing stops as soon as the
                     type of the first statement is known

   The text is modified in place: skipped comments are overwritten with spaces, and if batches
   are allowed, statement separating ';' are replaced with '\0'.

   Return values of the array initialization/insertion calls are not checked here.
   Returns 0 in all paths visible in this function. */
int ParseQuery(MADB_QUERY *Query)
{
char *p= Query->RefinedText, Quote;
/* FALSE - we are between tokens and the next meaningful character starts a new one */
BOOL ReadingToken= FALSE;
unsigned int Offset, StmtTokensCount= 0;
size_t Length= Query->RefinedLength;
/* NOTE(review): LastSemicolon is never used in this function */
char *end= p + Length, *CurQuery= NULL, *LastSemicolon= NULL;
enum enum_madb_query_type StmtType;
/* Initial sizes of both arrays are derived from the length of the query text */
MADB_InitDynamicArray(&Query->Tokens, (unsigned int)sizeof(unsigned int), (unsigned int)MAX(Length/32, 20), (unsigned int)MAX(Length/20, 40));
MADB_InitDynamicArray(&Query->SubQuery, (unsigned int)sizeof(SINGLE_QUERY), (unsigned int)MAX(Length/64, 20), (unsigned int)MAX(Length/64, 40));
Query->PoorManParsing= ShouldWeTryPoorManParsing(Query);
while (p < end)
{
if (ReadingToken == FALSE)
{
/* Beginning of a new token: moving to the first meaningful character (comments on the way are
   overwritten with spaces) and recording its position */
Length= end - p;
SkipSpacesAndComments(&p, &Length, TRUE);
SAVE_TOKEN(p);
++StmtTokensCount;
ReadingToken= TRUE;
/* On saving 1st statement's token, we remember where the statement begins */
if (StmtTokensCount == 1)
{
CurQuery= p;
}
/* Having 2 first tokens we can get statement type. And we need to know it for the case of multistatement -
some statements may "legally" contain ';' */
else if (StmtTokensCount == 2)
{
/* We are currently at 2nd token of statement, and getting previous token position from Tokens array*/
StmtType= MADB_GetQueryType(MADB_Token(Query, Query->Tokens.elements - 2), p);
Query->ReturnsResult= Query->ReturnsResult || !QUERY_DOESNT_RETURN_RESULT(StmtType);
MADB_AddSubQuery(Query, CurQuery, StmtType);
/* If we on first statement, setting QueryType*/
if (Query->Tokens.elements == 2)
{
Query->QueryType= StmtType;
/* In poor man mode the type of the first statement is all we need from the parsing */
if (Query->PoorManParsing)
{
return 0;
}
}
}
switch (*p)
{
/* If we get here, we are not supposed to be inside a string, so any of these characters opens
   a quoted string or identifier.
   NOTE(review): the original comment here referred to a `quote` being set on fall-through and to
   STRING_OR_COMMENT - nothing with such name exists in this function, it looks like a leftover
   from an earlier version */
case '"':
case '\'':
case '`':
{
char *SavePosition;
Quote= *p++;
SavePosition= p; /* In case we go past eos while looking for ending quote */
/* Choosing whether backslash escapes are honored while looking for the closing quote.
   NOTE(review): the trailing comment on the next line talks about backtick, but the code tests
   for double quote, which also makes the AnsiQuotes clause redundant - confirm this is intended */
if (Query->NoBackslashEscape || Quote == '"' || /* Backtick works with ANSI_QUOTES */
(Query->AnsiQuotes && Quote == '"'))/* In indetifier quotation backslash does not escape anything - CLI has error with that */
{
SkipQuotedString_Noescapes(&p, end, Quote);
}
else
{
SkipQuotedString(&p, end, Quote);
}
if (p >= end)
{
/* Closing quote has not been found before the end of the text. Probably the character we took
   for an opening quote was in fact the ending one - possible in poor man case, when we look for
   cursor name starting from the position inside string. Other options are bad query or parsing
   error. Returning to the position right after that quote and starting a new token there */
p= SavePosition;
ReadingToken= FALSE;
}
break;
}
case '?': /* This can break token(w/out space char), and be beginning of a token.
Thus we need it in both places */
if (Query->QueryType != MADB_QUERY_PREPARE) {
Query->HasParameters= 1;
/* Parameter placeholder is a complete token. And next one may begin right after it*/
ReadingToken= FALSE;
}
break;
case ';':
if (QueryIsPossiblyMultistmt(Query))
{
/* If batches are not allowed, we only need the fact, that this is multi-statement */
if (Query->BatchAllowed)
{
*p= '\0';
}
/* Next token starts a new statement */
StmtTokensCount= 0;
}
ReadingToken= FALSE;
/* We should not move pointer here */
break;
}
}
else
{
/* Inside of a token: any of these characters ends it */
switch (*p)
{
case '?':
case '"':
case '\'':
case '`':
case ' ':
case '\t':
case '\r':
case '\n':
case '-':
case '#':
case '/':
case ';':
ReadingToken= FALSE;
/* We should not move pointer here, since this can be already beginning of new token */
continue;
default:
break;
}
}
++p;
}
return 0;
}
/* Skips one comment, if the string begins with one.

   Recognized are comments starting with "--" or '#', which last till the end of the line, and
   C-style block comments. The closing sequence is searched for up to the terminating NUL of Str.

   Str       - text to examine
   Length    - in/out: length of Str. Reduced by the size of the skipped comment, or set to 0 if
               the comment is not closed
   OverWrite - if set, the skipped comment is overwritten with spaces

   Returns pointer to the first character after the comment; Str + *Length (as it was on entry)
   if the comment is not closed; Str itself if there is no comment or *Length is 0. */
char * StripLeadingComments(char *Str, size_t *Length, BOOL OverWrite)
{
  char *CommentEnd;
  int TerminatorLen;

  /* There is nothing to strip for sure */
  if (*Length == 0)
  {
    return Str;
  }

  /* Looking for the comment terminator, depending on the comment type */
  if (strncmp(Str, "--", 2) == 0)
  {
    CommentEnd= strchr(Str + 2, '\n');
    TerminatorLen= 1;
  }
  else if (*Str == '#')
  {
    CommentEnd= strchr(Str + 1, '\n');
    TerminatorLen= 1;
  }
  else if (strncmp(Str, "/*", 2) == 0)
  {
    CommentEnd= strstr(Str + 2, "*/");
    TerminatorLen= 2;
  }
  else
  {
    /* Not a comment */
    return Str;
  }

  if (CommentEnd == NULL)
  {
    /* Comment is not closed - everything till the end of the string belongs to it */
    CommentEnd= Str + *Length;
    *Length= 0;
  }
  else
  {
    /* The terminator is a part of the comment */
    CommentEnd+= TerminatorLen;
    *Length-= CommentEnd - Str;
  }

  /* On request - overwriting comment with white spaces */
  if (OverWrite)
  {
    memset(Str, ' ', CommentEnd - Str);
  }

  return CommentEnd;
}
C
1
https://gitee.com/openlookeng/hetu-odbc-driver.git
git@gitee.com:openlookeng/hetu-odbc-driver.git
openlookeng
hetu-odbc-driver
hetu-odbc-driver
master

搜索帮助