/** * WinPR: Windows Portable Runtime * Process Argument Vector Functions * * Copyright 2013 Marc-Andre Moreau * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #ifdef HAVE_CONFIG_H #include "config.h" #endif #include #include #include #include #ifdef HAVE_UNISTD_H #include #endif #include "../log.h" #define TAG WINPR_TAG("thread") /** * CommandLineToArgvW function: * http://msdn.microsoft.com/en-us/library/windows/desktop/bb776391/ * * CommandLineToArgvW has a special interpretation of backslash characters * when they are followed by a quotation mark character ("), as follows: * * 2n backslashes followed by a quotation mark produce n backslashes followed by a quotation mark. * (2n) + 1 backslashes followed by a quotation mark again produce n backslashes followed by a quotation mark. * n backslashes not followed by a quotation mark simply produce n backslashes. * * The address returned by CommandLineToArgvW is the address of the first element in an array of LPWSTR values; * the number of pointers in this array is indicated by pNumArgs. Each pointer to a null-terminated Unicode * string represents an individual argument found on the command line. * * CommandLineToArgvW allocates a block of contiguous memory for pointers to the argument strings, * and for the argument strings themselves; the calling application must free the memory used by the * argument list when it is no longer needed. To free the memory, use a single call to the LocalFree function. */ /** * Parsing C++ Command-Line Arguments: * http://msdn.microsoft.com/en-us/library/windows/desktop/17w5ykft * * Microsoft C/C++ startup code uses the following rules when * interpreting arguments given on the operating system command line: * * Arguments are delimited by white space, which is either a space or a tab. * * The caret character (^) is not recognized as an escape character or delimiter. * The character is handled completely by the command-line parser in the operating * system before being passed to the argv array in the program. * * A string surrounded by double quotation marks ("string") is interpreted as a * single argument, regardless of white space contained within. A quoted string * can be embedded in an argument. * * A double quotation mark preceded by a backslash (\") is interpreted as a * literal double quotation mark character ("). * * Backslashes are interpreted literally, unless they immediately * precede a double quotation mark. * * If an even number of backslashes is followed by a double quotation mark, * one backslash is placed in the argv array for every pair of backslashes, * and the double quotation mark is interpreted as a string delimiter. * * If an odd number of backslashes is followed by a double quotation mark, * one backslash is placed in the argv array for every pair of backslashes, * and the double quotation mark is "escaped" by the remaining backslash, * causing a literal double quotation mark (") to be placed in argv. * */ LPSTR* CommandLineToArgvA(LPCSTR lpCmdLine, int* pNumArgs) { char* p; int index; int length; char* pBeg; char* pEnd; char* buffer; char* pOutput; int numArgs; LPSTR* pArgs; int maxNumArgs; int maxBufferSize; int currentIndex; int cmdLineLength; BOOL* lpEscapedChars; LPSTR lpEscapedCmdLine; if (!lpCmdLine) return NULL; if (!pNumArgs) return NULL; pArgs = NULL; numArgs = 0; lpEscapedCmdLine = NULL; cmdLineLength = strlen(lpCmdLine); lpEscapedChars = (BOOL*) calloc(1, (cmdLineLength + 1) * sizeof(BOOL)); if (!lpEscapedChars) return NULL; if (strstr(lpCmdLine, "\\\"")) { int i, n; char* pLastEnd = NULL; lpEscapedCmdLine = (char*) malloc((cmdLineLength + 1) * sizeof(char)); if (!lpEscapedCmdLine) { free(lpEscapedChars); return NULL; } p = (char*) lpCmdLine; pLastEnd = (char*) lpCmdLine; pOutput = (char*) lpEscapedCmdLine; while (p < &lpCmdLine[cmdLineLength]) { pBeg = strstr(p, "\\\""); if (!pBeg) { length = strlen(p); CopyMemory(pOutput, p, length); pOutput += length; p += length; break; } pEnd = pBeg + 2; while (pBeg >= lpCmdLine) { if (*pBeg != '\\') { pBeg++; break; } pBeg--; } n = (pEnd - pBeg) - 1; length = (pBeg - pLastEnd); CopyMemory(pOutput, p, length); pOutput += length; p += length; for (i = 0; i < (n / 2); i++) { *pOutput = '\\'; pOutput++; } p += n + 1; if ((n % 2) != 0) lpEscapedChars[pOutput - lpEscapedCmdLine] = TRUE; *pOutput = '"'; pOutput++; pLastEnd = p; } *pOutput = '\0'; pOutput++; lpCmdLine = (LPCSTR) lpEscapedCmdLine; cmdLineLength = strlen(lpCmdLine); } maxNumArgs = 2; currentIndex = 0; p = (char*) lpCmdLine; while (currentIndex < cmdLineLength - 1) { index = strcspn(p, " \t"); currentIndex += (index + 1); p = (char*) &lpCmdLine[currentIndex]; maxNumArgs++; } maxBufferSize = (maxNumArgs * (sizeof(char*))) + (cmdLineLength + 1); buffer = (char*) HeapAlloc(GetProcessHeap(), HEAP_ZERO_MEMORY, maxBufferSize); if (!buffer) return NULL; pArgs = (LPSTR*) buffer; pOutput = (char*) &buffer[maxNumArgs * (sizeof(char*))]; numArgs = 0; currentIndex = 0; p = (char*) lpCmdLine; while (currentIndex < cmdLineLength) { pBeg = pEnd = p; while (1) { index = strcspn(p, " \t\"\0"); if ((p[index] == '"') && (lpEscapedChars[&p[index] - lpCmdLine])) { p = &p[index + 1]; continue; } break; } if (p[index] != '"') { /* no whitespace escaped with double quotes */ p = &p[index + 1]; pEnd = p - 1; length = (pEnd - pBeg); CopyMemory(pOutput, pBeg, length); pOutput[length] = '\0'; pArgs[numArgs++] = pOutput; pOutput += (length + 1); } else { p = &p[index + 1]; while (1) { index = strcspn(p, "\"\0"); if ((p[index] == '"') && (lpEscapedChars[&p[index] - lpCmdLine])) { p = &p[index + 1]; continue; } break; } if (p[index] != '"') { WLog_ERR(TAG, "parsing error: uneven number of unescaped double quotes!"); } if (p[index] == '\0') { p = &p[index + 1]; pEnd = p - 1; } else { p = &p[index + 1]; index = strcspn(p, " \t\0"); p = &p[index + 1]; pEnd = p - 1; } length = 0; pArgs[numArgs++] = pOutput; while (pBeg < pEnd) { if (*pBeg != '"') { *pOutput = *pBeg; pOutput++; length++; } pBeg++; } *pOutput = '\0'; pOutput++; } while ((*p == ' ') || (*p == '\t')) p++; currentIndex = (p - lpCmdLine); } if (lpEscapedCmdLine) free(lpEscapedCmdLine); if (lpEscapedChars) free(lpEscapedChars); *pNumArgs = numArgs; return pArgs; } #ifndef _WIN32 LPWSTR* CommandLineToArgvW(LPCWSTR lpCmdLine, int* pNumArgs) { return NULL; } #endif