Source code of Windows XP (NT5)
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

1986 lines
51 KiB

  1. /*
  2. A hack to look in source files for "sharing hazards",
  3. very simple code patterns that should be examined to determine
  4. if multiple versions of the code can live "side-by-side".
  5. Problems are explicit unversioned sharing.
  6. Registry writes.
  7. File system writes.
  8. Naming of objects (kernel objects) -- open or create.
  9. */
  10. /*
  11. UNDONE and BUGS
  12. preprocessor directives are ignored
  13. the behavior of mbcs in strings and comments is not quite determinate
  14. there is not yet anyway to quash warnings
  15. backslash line continuation is not implemented, nor are trigraphs (trigraphs can produce
  16. # and \ for preprocessor directives or line continuation)
  17. no unicode support
  18. no \u support
  19. not quite tolerant of embedded nuls in file, but almost now
  20. some inefficiency
  21. some uncleanliness
  22. the reuse of the comment stripper isn't quite right
  23. the global line tracking isn't ver effiecent, but works
  24. @owner a-JayK
  25. */
  26. /\
  27. *
  28. BUG line continuation
  29. *\
  30. /
  31. /\
  32. / not honored
  33. /* The VC6 editor does not highlight the above correctly, but
  34. the compiler implements it correctly. */
  35. #pragma warning(disable:4786) /* long names in debug info truncated */
  36. #pragma warning(disable:4018) /* signed/unsigned */
  37. #include "MinMax.h"
  38. /* notice how good VC's support of trigraphs and line continuation is */
  39. ??=include <st??/
  40. dio.h>
  41. #include <stdlib.h>
  42. #include <string.h>
  43. #include <ctype.h>
  44. #incl\
  45. ude "windows.h"
  46. #define NUMBER_OF(x) (sizeof(x)/sizeof((x)[0]))
  47. #include "Casts.h"
  48. void CheckHresult(HRESULT);
  49. void ThrowHresult(HRESULT);
  50. #include "Handle.h"
  51. #include "comdef.h"
  52. #include <algorithm>
  53. #include <string>
  54. #include <vector>
  55. #include <set>
  56. #include <stack>
  57. #include <iostream>
  58. typedef struct HazardousFunction HazardousFunction;
  59. typedef int (__cdecl* QsortFunction)(const void*, const void*);
  60. typedef int (__cdecl* BsearchFunction)(const void*, const void*);
  61. class CLine;
  62. class CClass;
  63. enum ETokenType;
  64. /* get msvcrt.dll wildcard processing, doesn't work with libc.lib */
  65. //extern
  66. //#if defined(__cplusplus)
  67. //"C"
  68. //#endif
  69. //int _dowildcard = 1;
  70. const char* CheckCreateObject(const CClass&);
  71. const char* CheckCreateFile(const CClass&);
  72. const char* CheckRegOpenEx(const CClass&);
  73. void PrintOpenComment();
  74. void PrintCloseComment();
  75. void PrintSeperator();
  76. unsigned short StringLeadingTwoCharsTo14Bits(const char* s);
  77. void __stdcall CheckHresult(HRESULT hr)
  78. {
  79. if (FAILED(hr))
  80. ThrowHresult(hr);
  81. }
  82. void __stdcall ThrowHresult(HRESULT hr)
  83. {
  84. throw _com_error(hr, NULL);
  85. }
  86. const char banner[] = "SharingHazardCheck version " __DATE__ " " __TIME__ "\n";
  87. const char usage[]=
  88. "%s [options directories files]\n"
  89. "version: " __DATE__ " " __TIME__ "\n"
  90. "\n"
  91. "Options may appear in any order; command line is order independent\n"
  92. "Wildcards are accepted for filenames. Wildcards never match directories.\n"
  93. "\n"
  94. "default output format\n"
  95. " file(line):reason\n"
  96. "-recurse\n"
  97. "-print-line\n"
  98. " prints line of code with offending function after file(line):reason\n"
  99. "-print-statement\n"
  100. " print statement containing offending function after file(line):reason\n"
  101. " supersedes -print-line\n"
  102. //"-print-context-lines:n\n"
  103. //" -print-statement plus surrounding n lines (not implemented)\n"
  104. "-print-context-statements:n (n is 1-4, pinned at 4, 0 untested)\n"
  105. " -print-statement plus surrounding n \"statements\"\n"
  106. "file names apply across all directories recursed into\n"
  107. "wild cards apply across all directories recursed into\n"
  108. "naming a directory implies one level recursion (unless -recurse is also seen)\n"
  109. //"environment variable SHARING_HAZARD_CHECK_OPTIONS added to argv (not implemented)\n"
  110. "all directory walking happens before any output is generated, it is slow\n"
  111. "\n"
  112. "The way recursion and wildcards work might not be intuitive.\n";
  113. enum ETokenType
  114. {
  115. /* character values show up too including
  116. (), but probably not for any potentially multi char token like !=
  117. */
  118. eTokenTypeIdentifier = 128,
  119. eTokenTypeHazardousFunction,
  120. eTokenTypeStringConstant,
  121. eTokenTypeCharConstant,
  122. eTokenTypeNumber, /* floating point or integer, we don't care */
  123. eTokenTypePreprocessorDirective /* the entire line is one token */
  124. };
  125. class CLine
  126. {
  127. public:
  128. CLine() : m_start(0), m_number(1)
  129. {
  130. }
  131. const char* m_start;
  132. int m_number;
  133. };
  134. class CRange
  135. {
  136. public:
  137. const char* begin;
  138. const char* end;
  139. };
  140. typedef CRange CStatement;
  141. class CClass
  142. {
  143. public:
  144. CClass();
  145. explicit CClass(const CClass&);
  146. void operator=(const CClass&);
  147. ~CClass() { }
  148. bool OpenFile(const char*);
  149. int GetCharacter();
  150. ETokenType GetToken();
  151. /* public */
  152. const char* m_tokenText; /* only valid for identifiers */
  153. int m_tokenLength; /* only valid for identifiers */
  154. ETokenType m_eTokenType;
  155. HazardousFunction* m_hazardousFunction;
  156. /* semi private */
  157. const char* m_begin; // used to issue warnings for copied/sub scanners
  158. const char* m_str; // current position
  159. const char* m_end; // usually end of file, sometimes earlier ("just past")
  160. bool m_fPoundIsPreprocessor; // is # a preprocessor directive?
  161. int m_spacesSinceNewline; /* FUTURE deduce indentation style */
  162. bool m_fInComment; // if we return newlines within comments.. (we don't)
  163. char m_rgchUnget[16]; /* UNDONE this is bounded to like 1 right? */
  164. int m_nUnget;
  165. void NoteStatementStart(const char*);
  166. // a statement is simply code delimited by semicolons,
  167. // we are confused by if/while/do/for
  168. mutable CStatement m_statements[4];
  169. mutable unsigned m_istatement;
  170. bool ScanToCharacter(int ch);
  171. const char* ScanToFirstParameter();
  172. const char* ScanToNextParameter();
  173. const char* ScanToNthParameter(int);
  174. int CountParameters() const; // negative if unable to "parse"
  175. const char* ScanToLastParameter();
  176. const char* ScanToSecondFromLastParameter();
  177. const char* SpanEnd(const char* set) const;
  178. bool FindString(const char*) const;
  179. CLine m_line;
  180. CLine m_nextLine; /* hack.. */
  181. void Warn(const char* = "") const;
  182. void PrintCode() const;
  183. // bool m_fPrintContext;
  184. // bool m_fPrintFullStatement;
  185. bool m_fPrintCarets;
  186. void RecordStatement(int ch);
  187. void OrderStatements() const;
  188. const char* m_statementStart;
  189. char m_fullPath[MAX_PATH];
  190. private:
  191. int GetCharacter2();
  192. void UngetCharacter2(int ch);
  193. CFusionFile m_file;
  194. CFileMapping m_fileMapping;
  195. CMappedViewOfFile m_view;
  196. };
  197. class CSharingHazardCheck
  198. {
  199. public:
  200. CSharingHazardCheck();
  201. void Main(int argc, char** argv);
  202. void ProcessArgs(int argc, char** argv, std::vector<std::string>& files);
  203. int ProcessFile(const std::string&);
  204. // bool m_fRecurse;
  205. // int m_nPrintContextStatements;
  206. };
  207. int g_nPrintContextStatements = 0;
  208. bool g_fPrintFullStatement = true;
  209. bool g_fPrintLine = true;
  210. CSharingHazardCheck app;
  211. CSharingHazardCheck::CSharingHazardCheck()
  212. //:
  213. // m_fRecurse(false),
  214. // m_nPrintContextStatements(0)
  215. {
  216. }
  217. template <typename Iterator1, typename T>
  218. Iterator1 __stdcall SequenceLinearFindValue(Iterator1 begin, Iterator1 end, T value)
  219. {
  220. for ( ; begin != end && *begin != value ; ++begin)
  221. {
  222. /* nothing */
  223. }
  224. return begin;
  225. }
  226. template <typename Iterator1, typename Iterator2>
  227. long __stdcall SequenceLengthOfSpanIncluding(Iterator1 begin, Iterator1 end, Iterator2 setBegin, Iterator2 setEnd)
  228. {
  229. long result = 0;
  230. while (begin != end && SequenceLinearFindValue(setBegin, setEnd, *begin) != setEnd)
  231. {
  232. ++begin;
  233. ++result;
  234. }
  235. return result;
  236. }
  237. template <typename Iterator1, typename Iterator2>
  238. long __stdcall SequenceLengthOfSpanExcluding(Iterator1 begin, Iterator1 end, Iterator2 setBegin, Iterator2 setEnd)
  239. {
  240. long result = 0;
  241. while (begin != end && SequenceLinearFindValue(setBegin, setEnd, *begin) == setEnd)
  242. {
  243. ++begin;
  244. ++result;
  245. }
  246. return result;
  247. }
  248. #define CASE_AZ \
  249. case 'A':case 'B':case 'C':case 'D':case 'E':case 'F':case 'G':case 'H':case 'I': \
  250. case 'J':case 'K':case 'L':case 'M':case 'N':case 'O':case 'P':case 'Q':case 'R': \
  251. case 'S':case 'T':case 'U':case 'V':case 'W':case 'X':case 'Y':case 'Z'
  252. #define CASE_az \
  253. case 'a':case 'b':case 'c':case 'd':case 'e':case 'f':case 'g':case 'h':case 'i': \
  254. case 'j':case 'k':case 'l':case 'm':case 'n':case 'o':case 'p':case 'q':case 'r': \
  255. case 's':case 't':case 'u':case 'v':case 'w':case 'x':case 'y':case 'z'
  256. #define CASE_09 \
  257. case '0':case '1':case '2':case '3':case '4': \
  258. case '5':case '6':case '7':case '8':case '9'
  259. /* try to keep character set stuff somewhat centralized */
  260. #define CASE_HORIZONTAL_SPACE case ' ': case '\t'
  261. // 0x1a is control-z; it probably marks end of file, but it's pretty rare
  262. // and usually followed by end of file, so we just treat it as vertical space
  263. #define CASE_VERTICAL_SPACE case '\n': case '\r': case 0xc: case 0x1a
  264. #define CASE_SPACE CASE_HORIZONTAL_SPACE: CASE_VERTICAL_SPACE
  265. #define VERTICAL_SPACE "\n\r\xc\x1a"
  266. #define HORIZONTAL_SPACE " \t"
  267. #define SPACE HORIZONTAL_SPACE VERTICAL_SPACE
  268. bool IsVerticalSpace(int ch) { return (ch == '\n' || ch == '\r' || ch == 0xc || ch == 0x1a); }
  269. bool IsHorizontalSpace(int ch) { return (ch == ' ' || ch == '\t'); }
  270. bool IsSpace(int ch) { return IsHorizontalSpace(ch) || IsVerticalSpace(ch); }
  271. #define DIGITS10 "0123456789"
  272. #define DIGITS_EXTRA_HEX "abcdefABCDEFxX"
  273. #define DIGITS_EXTRA_TYPE "uUlLfFDd" /* not sure about fFdD for float/double */
  274. #define DIGITS_EXTRA_FLOAT "eE."
  275. const char digits10[] = DIGITS10;
  276. #define DIGITS_ALL DIGITS10 DIGITS_EXTRA_TYPE DIGITS_EXTRA_HEX DIGITS_EXTRA_FLOAT
  277. const char digitsAll[] = DIGITS_ALL;
  278. #define UPPER_LETTERS "ABCDEFGHIJKLMNOPQRSTUVWXYZ"
  279. #define LOWER_LETTERS "abcdefghijklmnopqrstuvwxyz"
  280. #define IDENTIFIER_CHARS UPPER_LETTERS LOWER_LETTERS DIGITS10 "_"
  281. const char upperLetters[] = UPPER_LETTERS;
  282. const char lowerLetters[] = LOWER_LETTERS;
  283. const char identifierChars[] = IDENTIFIER_CHARS;
  284. #define JAYK 0
  285. #if JAYK
  286. #if _M_IX86
  287. #define BreakPoint() __asm { int 3 }
  288. #else
  289. #define BreakPoint() DebugBreak()
  290. #endif
  291. #else
  292. #define BreakPoint() /* nothing */
  293. #endif
  294. /* actually..these don't work unless we #undef what windows.h gives us ..
  295. #define STRINGIZE_EVAL_AGAIN(name) #name
  296. #define STRINGIZE(name) STRINGIZE_EVAL_AGAIN(name)
  297. #define PASTE_EVAL_AGAIN(x,y) x##y
  298. #define PASTE(x,y) PASTE_EVAL_AGAIN(x,y)
  299. #define STRINGIZE_A(x) STRINGIZE(PASTE(x,A))
  300. #define STRINGIZE_W(x) STRINGIZE(PASTE(x,W))
  301. */
  302. bool fReturnNewlinesInComments = false; /* untested */
  303. const char szOpenNamedObject[] = "Open Named Object";
  304. const char szCreateNamedObject[] = "Create Named Object";
  305. const char szRegistryWrite[] = "Registry Write";
  306. const char szFileWrite[] = "File Write";
  307. const char szRegOpenNotUnderstood[] = "RegOpen parameters not understood";
  308. const char szRegisteryRead[] = "Registry Read";
  309. const char szCOM1[] = "CoRegisterClassObject";
  310. const char szCOM2[] = "CoRegisterPSClsid";
  311. const char szOpenFile[] = "File I/O";
  312. const char szLOpen[] = "File I/O"; // UNDONE look at the access parameter
  313. const char szStructuredStorage[] = "Structured Storage I/O"; // UNDONE look at the access parameter
  314. const char szQueryWindowClass[] = "Query Window Class Info";
  315. const char szCreateWindowClass[] = "Create Window Class";
  316. const char szAtom[] = "Atom stuff";
  317. const char szRegisterWindowMessage[] = "Register Window Message";
  318. const char szCreateFileNotUnderstood[] = "CreateFile parameters not understood";
  319. const char szCreateObjectNotUnderstood[] = "Create object parameters not understood";
  320. const char szSetEnvironmentVariable[] = "Set Environment Variable";
  321. const char szWriteEventLog[] = "Event Log Write";
  322. struct HazardousFunction
  323. {
  324. const char* api;
  325. const char* message;
  326. const char* (*function)(const CClass&);
  327. int apiLength;
  328. //__int64 pad;
  329. };
  330. HazardousFunction hazardousFunctions[] =
  331. {
  332. #define HAZARDOUS_FUNCTION_AW3(api, x, y) \
  333. /* if we evaluate again, we pick up the macros from windows.h .. */ \
  334. { # api, x, y }, \
  335. { # api "A", x, y }, \
  336. { # api "W", x, y }
  337. #define HAZARDOUS_FUNCTION_AW2(api, x) \
  338. /* if we evaluate again, we pick up the macros from windows.h .. */ \
  339. { # api, x }, \
  340. { # api "A", x }, \
  341. { # api "W", x }
  342. #define HAZARDOUS_FUNCTION2(api, x ) \
  343. /* if we evaluate again, we pick up the macros from windows.h .. */ \
  344. { # api, x } \
  345. #define HAZARDOUS_FUNCTION3(api, x, y ) \
  346. /* if we evaluate again, we pick up the macros from windows.h .. */ \
  347. { # api, x, y } \
  348. /*--------------------------------------------------------------------------
  349. registry
  350. --------------------------------------------------------------------------*/
  351. HAZARDOUS_FUNCTION_AW2(RegCreateKey, szRegistryWrite),
  352. HAZARDOUS_FUNCTION_AW2(RegCreateKeyEx, szRegistryWrite),
  353. HAZARDOUS_FUNCTION_AW2(RegOpenKey, szRegistryWrite),
  354. // UNDONE check the access parameter
  355. HAZARDOUS_FUNCTION_AW3(RegOpenKeyEx, NULL, CheckRegOpenEx),
  356. HAZARDOUS_FUNCTION3(RegOpenUserClassesRoot, NULL, CheckRegOpenEx),
  357. HAZARDOUS_FUNCTION3(RegOpenCurrentUser, NULL, CheckRegOpenEx),
  358. //HAZARDOUS_FUNCTION_AW2(RegOpenKeyEx, szRegistryWrite),
  359. //HAZARDOUS_FUNCTION2(RegOpenUserClassesRoot, szRegistryWrite),
  360. // These don't require opening a key, they are legacy Win16 APIs
  361. HAZARDOUS_FUNCTION_AW2(RegSetValue, szRegistryWrite),
  362. // These are caught by the RegCreateKey or RegOpenKey with particular access.
  363. //HAZARDOUS_FUNCTION(RegSetValueEx, szReistryWrite),
  364. // SHReg* in shlwapi.dll
  365. HAZARDOUS_FUNCTION_AW2(SHRegCreateUSKey, szRegistryWrite),
  366. HAZARDOUS_FUNCTION_AW2(SHRegDeleteEmptyUSKey, szRegistryWrite),
  367. HAZARDOUS_FUNCTION_AW2(SHRegDeleteUSValue, szRegistryWrite),
  368. //UNDONEHAZARDOUS_FUNCTION_AW3(SHRegOpenUSKey, NULL, CheckSHRegOpen),
  369. HAZARDOUS_FUNCTION_AW2(SHRegSetPath, szRegistryWrite),
  370. HAZARDOUS_FUNCTION_AW2(SHRegSetUSValue, szRegistryWrite),
  371. // should be caught by OpenKey
  372. //HAZARDOUS_FUNCTION_AW2(SHRegWriteUSValue, szRegistryWrite),
  373. HAZARDOUS_FUNCTION_AW2(SetEnvironmentVariable, szSetEnvironmentVariable),
  374. /*--------------------------------------------------------------------------
  375. file i/o, esp. writing
  376. --------------------------------------------------------------------------*/
  377. HAZARDOUS_FUNCTION_AW3(CreateFile, NULL, CheckCreateFile),
  378. // legacy Win16 APIs. UNDONE check the access parameter, but
  379. // really any uses of these should be changed to CreateFile
  380. HAZARDOUS_FUNCTION2(OpenFile, szOpenFile),
  381. HAZARDOUS_FUNCTION2(_lopen, szLOpen),
  382. //HAZARDOUS_FUNCTION(fopen, szFOpen, CheckFOpen),
  383. /*--------------------------------------------------------------------------
  384. monikers
  385. --------------------------------------------------------------------------*/
  386. /*--------------------------------------------------------------------------
  387. structured storage
  388. --------------------------------------------------------------------------*/
  389. // UNDONE check the access parameter
  390. HAZARDOUS_FUNCTION2(StgOpenStorage, szStructuredStorage),
  391. HAZARDOUS_FUNCTION2(StgOpenStorageEx, szStructuredStorage),
  392. HAZARDOUS_FUNCTION2(StgCreateDocfile, szStructuredStorage),
  393. HAZARDOUS_FUNCTION2(StgCreateStorageEx, szStructuredStorage),
  394. /*--------------------------------------------------------------------------
  395. .exe servers / COM
  396. --------------------------------------------------------------------------*/
  397. HAZARDOUS_FUNCTION2(CoRegisterClassObject, szCOM1),
  398. HAZARDOUS_FUNCTION2(CoRegisterPSClsid, szCOM2),
  399. /*--------------------------------------------------------------------------
  400. named kernel objects
  401. --------------------------------------------------------------------------*/
  402. // Create named or anonymous, anonymous is not a hazard
  403. HAZARDOUS_FUNCTION_AW3(CreateDesktop, NULL, CheckCreateObject),
  404. HAZARDOUS_FUNCTION_AW3(CreateEvent, NULL, CheckCreateObject),
  405. HAZARDOUS_FUNCTION_AW3(CreateFileMapping, NULL, CheckCreateObject),
  406. HAZARDOUS_FUNCTION_AW3(CreateJobObject, NULL, CheckCreateObject),
  407. HAZARDOUS_FUNCTION_AW3(CreateMutex, NULL, CheckCreateObject),
  408. HAZARDOUS_FUNCTION_AW2(CreateMailslot, szOpenNamedObject), // never anonymous
  409. HAZARDOUS_FUNCTION_AW2(CreateNamedPipe, szOpenNamedObject), // never anonymous
  410. HAZARDOUS_FUNCTION_AW3(CreateSemaphore, NULL, CheckCreateObject),
  411. HAZARDOUS_FUNCTION_AW3(CreateWaitableTimer, NULL, CheckCreateObject),
  412. HAZARDOUS_FUNCTION_AW3(CreateWindowStation, NULL, CheckCreateObject),
  413. // open by name
  414. HAZARDOUS_FUNCTION_AW2(OpenDesktop, szOpenNamedObject),
  415. HAZARDOUS_FUNCTION_AW2(OpenEvent, szOpenNamedObject),
  416. HAZARDOUS_FUNCTION_AW2(OpenFileMapping, szOpenNamedObject),
  417. HAZARDOUS_FUNCTION_AW2(OpenJobObject, szOpenNamedObject),
  418. HAZARDOUS_FUNCTION_AW2(OpenMutex, szOpenNamedObject),
  419. HAZARDOUS_FUNCTION_AW2(CallNamedPipe, szOpenNamedObject),
  420. HAZARDOUS_FUNCTION_AW2(OpenSemaphore, szOpenNamedObject),
  421. HAZARDOUS_FUNCTION_AW2(OpenWaitableTimer, szOpenNamedObject),
  422. HAZARDOUS_FUNCTION_AW2(OpenWindowStation, szOpenNamedObject),
  423. /*
  424. EnumProcesses?
  425. Toolhelp
  426. */
  427. /*--------------------------------------------------------------------------
  428. window classes
  429. --------------------------------------------------------------------------*/
  430. // Fusion should handle these automagically.
  431. // these two take a class name as a parameter
  432. #if 0
  433. // many false positives on typelib related stuff
  434. //HAZARDOUS_FUNCTION_AW2(GetClassInfo, szQueryWindowClass),
  435. #else
  436. // this still produces many false positives..
  437. //HAZARDOUS_FUNCTION_AW2(WNDCLASS, szQueryWindowClass),
  438. //HAZARDOUS_FUNCTION_AW2(WNDCLASSEX, szQueryWindowClass),
  439. #endif
  440. //HAZARDOUS_FUNCTION_AW2(GetClassInfoEx, szQueryWindowClass),
  441. // Fusion should handle these automagically.
  442. // this returns a class name
  443. // HAZARDOUS_FUNCTION_AW2(GetClassName, szQueryWindowClass),
  444. // Fusion should handle these automagically.
  445. // this creates classes
  446. //HAZARDOUS_FUNCTION_AW2(RegisterClass, szCreateWindowClass),
  447. //HAZARDOUS_FUNCTION_AW2(RegisterClassEx, szCreateWindowClass),
  448. /*--------------------------------------------------------------------------
  449. window messages
  450. --------------------------------------------------------------------------*/
  451. // We aren't convinced this is a problem.
  452. //HAZARDOUS_FUNCTION_AW2(RegisterWindowMessage, szRegisterWindowMessage),
  453. /*--------------------------------------------------------------------------
  454. atoms
  455. --------------------------------------------------------------------------*/
  456. HAZARDOUS_FUNCTION_AW2(AddAtom, szAtom),
  457. HAZARDOUS_FUNCTION_AW2(FindAtom, szAtom),
  458. HAZARDOUS_FUNCTION_AW2(GlobalAddAtom, szAtom),
  459. HAZARDOUS_FUNCTION_AW2(GlobalFindAtom, szAtom),
  460. /*
  461. InitAtomTable,
  462. DeleteAtom,
  463. GetAtomName,
  464. GlobalDeleteAtom,
  465. GlobalGetAtomName
  466. */
  467. /*--------------------------------------------------------------------------
  468. DDE?
  469. clipboard?
  470. --------------------------------------------------------------------------*/
  471. /*--------------------------------------------------------------------------
  472. Ole data transfer
  473. --------------------------------------------------------------------------*/
  474. HAZARDOUS_FUNCTION2(RegisterMediaTypeClass, szRegistryWrite),
  475. HAZARDOUS_FUNCTION2(RegisterMediaTypes, szRegistryWrite),
  476. HAZARDOUS_FUNCTION2(OleUICanConvertOrActivatfeAs, szRegisteryRead),
  477. HAZARDOUS_FUNCTION2(OleRegEnumFormatEtc, szRegisteryRead),
  478. HAZARDOUS_FUNCTION2(OleRegEnumVerbs, szRegisteryRead),
  479. /*--------------------------------------------------------------------------
  480. NT event log
  481. --------------------------------------------------------------------------*/
  482. HAZARDOUS_FUNCTION_AW2(RegisterEventSource, szRegistryWrite),
  483. HAZARDOUS_FUNCTION_AW2(ClearEventLog, szWriteEventLog),
  484. HAZARDOUS_FUNCTION_AW2(ReportEvent, szWriteEventLog),
  485. /*--------------------------------------------------------------------------
  486. UNDONE think about these
  487. HAZARDOUS_FUNCTION_AW2(CreateEnhMetaFile, szWriteGdiMetaFile),
  488. HAZARDOUS_FUNCTION_AW2(DeleteEnhMetaFile, szWriteGdiMetaFile),
  489. HAZARDOUS_FUNCTION_AW2(DeleteMetaFile, szWriteGdiMetaFile),
  490. HAZARDOUS_FUNCTION_AW2(CreateMetaFile, szWriteGdiMetaFile),
  491. HAZARDOUS_FUNCTION_AW2(DeleteFile, szWriteFileSystem),
  492. HAZARDOUS_FUNCTION_AW2(MoveFile, szWriteFileSystem),
  493. HAZARDOUS_FUNCTION_AW2(RemoveDirectory, szWriteFileSystem),
  494. HAZARDOUS_FUNCTION_AW2(ReplaceFile, szWriteFileSystem),
  495. RegDelete* (handled by RegOpen)
  496. SHReg* (?handled by open)
  497. CreateService OpenSCManager (not done)
  498. SetWindowsHook SetWindowsHookEx (not done)
  499. --------------------------------------------------------------------------*/
  500. };
  501. int __cdecl CompareHazardousFunction(const HazardousFunction* x, const HazardousFunction* y)
  502. {
  503. int i = 0;
  504. int minlength = 0;
  505. /* one of the strings is not nul terminated */
  506. if (x->apiLength == y->apiLength)
  507. {
  508. i = strncmp(x->api, y->api, x->apiLength);
  509. return i;
  510. }
  511. minlength = x->apiLength < y->apiLength ? x->apiLength : y->apiLength;
  512. i = strncmp(x->api, y->api, minlength);
  513. if (i != 0)
  514. return i;
  515. return (minlength == x->apiLength) ? -1 : +1;
  516. }
  517. bool leadingTwoCharsAs14Bits[1U<<14];
  518. void CClass::UngetCharacter2(int ch)
  519. {
  520. /* if you m_rgchUnget a newline, line numbers will get messed up
  521. we only m_rgchUnget forward slashes
  522. */
  523. m_rgchUnget[m_nUnget++] = static_cast<char>(ch);
  524. }
  525. int CClass::GetCharacter2()
  526. {
  527. int ch;
  528. m_line = m_nextLine; /* UNDONE clean this hack up */
  529. if (m_nUnget)
  530. {
  531. return m_rgchUnget[--m_nUnget];
  532. }
  533. /* undone break the nul termination dependency.. */
  534. if (m_str == m_end)
  535. return 0;
  536. ch = *m_str;
  537. m_str += 1;
  538. switch (ch)
  539. {
  540. /* it is for line continuation that this function is really needed.. */
  541. case '\\': /* line continuation not implemented */
  542. case '?': /* trigraphs not implemented */
  543. default:
  544. break;
  545. case 0xc: /* formfeed, control L, very common in NT source */
  546. ch = '\n';
  547. break;
  548. case '\t':
  549. ch = ' ';
  550. break;
  551. case '\r':
  552. ch = '\n';
  553. /* skip \n after \r */
  554. if (*m_str == '\n')
  555. m_str += 1;
  556. /* fall through */
  557. case '\n':
  558. m_nextLine.m_start = m_str;
  559. m_nextLine.m_number += 1;
  560. //if (m_nextLine.m_number == 92)
  561. //{
  562. // BreakPoint();
  563. //}
  564. break;
  565. }
  566. return ch;
  567. }
  568. int CClass::GetCharacter()
  569. {
  570. int ch;
  571. if (m_fInComment)
  572. goto Lm_fInComment;
  573. m_fInComment = false;
  574. ch = GetCharacter2();
  575. switch (ch)
  576. {
  577. default:
  578. goto Lret;
  579. case '/':
  580. ch = GetCharacter2();
  581. switch (ch)
  582. {
  583. default:
  584. UngetCharacter2(ch);
  585. ch = '/';
  586. goto Lret;
  587. case '/':
  588. while ((ch = GetCharacter2())
  589. && !IsVerticalSpace(ch))
  590. {
  591. /* nothing */
  592. }
  593. goto Lret; /* return the \n or 0*/
  594. case '*':
  595. Lm_fInComment:
  596. L2:
  597. ch = GetCharacter2();
  598. switch (ch)
  599. {
  600. case '\n':
  601. if (!fReturnNewlinesInComments)
  602. goto L2;
  603. m_fInComment = true;
  604. goto Lret;
  605. default:
  606. goto L2;
  607. case 0:
  608. /* unclosed comment at end of file, just return end */
  609. printf("unclosed comment\n");
  610. goto Lret;
  611. case '*':
  612. L1:
  613. ch = GetCharacter2();
  614. switch (ch)
  615. {
  616. default:
  617. goto L2;
  618. case 0:
  619. /* unclosed comment at end of file, just return end */
  620. printf("unclosed comment\n");
  621. goto Lret;
  622. case '/':
  623. ch = ' ';
  624. goto Lret;
  625. case '*':
  626. goto L1;
  627. }
  628. }
  629. }
  630. }
  631. Lret:
  632. return ch;
  633. }
  634. CClass::CClass(const CClass& that)
  635. {
  636. // yucky laziness
  637. memcpy(this, &that, sizeof(*this));
  638. // the copy must not outlive the original!
  639. // or we could DuplicateHandle the handles and make a new mapping..
  640. m_begin = that.m_str;
  641. m_file.Detach();
  642. m_fileMapping.Detach();
  643. m_view.Detach();
  644. }
  645. CClass::CClass()
  646. {
  647. // yucky laziness
  648. memset(this, 0, sizeof(*this));
  649. // m_fPrintContext = false;
  650. // m_fPrintFullStatement = true;
  651. m_fPrintCarets = false;
  652. m_fPoundIsPreprocessor = true;
  653. m_file.Detach();
  654. m_fileMapping.Detach();
  655. m_view.Detach();
  656. }
  657. ETokenType CClass::GetToken()
  658. {
  659. int i = 0;
  660. int ch = 0;
  661. unsigned twoCharsAs14Bits = 0;
  662. char ch2[3] = {0,0,0};
  663. HazardousFunction lookingForHazardousFunction;
  664. HazardousFunction* foundHazardousFunction;
  665. L1:
  666. ch = GetCharacter();
  667. switch (ch)
  668. {
  669. default:
  670. m_fPoundIsPreprocessor = false;
  671. break;
  672. CASE_VERTICAL_SPACE:
  673. m_fPoundIsPreprocessor = true;
  674. goto L1;
  675. case '#':
  676. break;
  677. CASE_HORIZONTAL_SPACE:
  678. goto L1;
  679. }
  680. switch (ch)
  681. {
  682. default:
  683. BreakPoint();
  684. printf("\n%s(%d): unhandled character %c, stopping processing this file\n", m_fullPath, m_line.m_number, ch);
  685. case 0:
  686. return INT_TO_ENUM_CAST(ETokenType)(0);
  687. break;
  688. /* FUTURE, we pick these up as bogus seperate tokens instead of doing
  689. line continuation */
  690. case '\\':
  691. return (m_eTokenType = INT_TO_ENUM_CAST(ETokenType)(ch));
  692. /* one character tokens */
  693. case '{': /* 0x7b to turn off editor interaction.. */
  694. case '}': /* 0x7D to turn off editor interaction.. */
  695. case '?': /* we don't handle trigraphs */
  696. case '[':
  697. case ']':
  698. case '(':
  699. case ',':
  700. case ')':
  701. case ';':
  702. return (m_eTokenType = INT_TO_ENUM_CAST(ETokenType)(ch));
  703. /* one two or three character tokens */
  704. case '.': /* . .* */
  705. case '<': /* < << <<= */
  706. case '>': /* > >> >>= */
  707. case '+': /* + ++ += */
  708. case '-': /* - -- -= -> ->* */
  709. case '*': /* * *= */ /* and ** in C9x */
  710. case '/': /* / /= */
  711. case '%': /* % %= */
  712. case '^': /* ^ ^= */
  713. case '&': /* & && &= */
  714. case '|': /* | || |= */
  715. case '~': /* ~ ~= */
  716. case '!': /* ! != */
  717. case ':': /* : :: */
  718. case '=': /* = == */
  719. /* just lie and return them one char at a time */
  720. return (m_eTokenType = INT_TO_ENUM_CAST(ETokenType)(ch));
  721. case '#':
  722. /* not valid in general, only if m_fPoundIsPreprocessor or actually in a #define,
  723. but we don't care */
  724. if (!m_fPoundIsPreprocessor)
  725. return (m_eTokenType = INT_TO_ENUM_CAST(ETokenType)(ch));
  726. /* lack of backslash line continuation makes the most difference here */
  727. while ((ch = GetCharacter()) && !IsVerticalSpace(ch))
  728. {
  729. /* nothing */
  730. }
  731. return (m_eTokenType = eTokenTypePreprocessorDirective);
  732. case '\'':
  733. /* NT uses multi char char constants..
  734. call GetCharacter2 instead of GetCharacter so that
  735. comments in char constants are not treated as comments */
  736. while ((ch = GetCharacter2()) && ch != '\'')
  737. {
  738. /* notice the bogosity, escapes are multiple characters,
  739. but \' is not, and that's all we care about skipping correctly */
  740. if (ch == '\\')
  741. GetCharacter2();
  742. }
  743. return (m_eTokenType = eTokenTypeCharConstant);
  744. case '\"':
  745. /* call GetCharacter2 instead of GetCharacter so that
  746. comments in string constants are not treated as comments */
  747. while ((ch = GetCharacter2()) && ch != '\"')
  748. {
  749. /* notice the bogosity, escapes are multiple characters,
  750. but \" is not, and that's all we care about skipping correctly */
  751. if (ch == '\\')
  752. GetCharacter2();
  753. }
  754. return (m_eTokenType = eTokenTypeStringConstant);
  755. CASE_09:
  756. /* integer or floating point, including hex,
  757. we ignore some invalid forms */
  758. m_str += SequenceLengthOfSpanIncluding(m_str, m_end, digitsAll, digitsAll+NUMBER_OF(digitsAll)-1);
  759. return (m_eTokenType = eTokenTypeNumber);
  760. case '$': /* non standard, used by NT */
  761. CASE_AZ:
  762. CASE_az:
  763. case '_':
  764. /* notice, keywords like if/else/while/class are just
  765. returned as identifiers, that is sufficient for now
  766. */
  767. i = SequenceLengthOfSpanIncluding(m_str, m_end, identifierChars, identifierChars+NUMBER_OF(identifierChars)-1);
  768. twoCharsAs14Bits = StringLeadingTwoCharsTo14Bits(m_str - 1);
  769. if (!leadingTwoCharsAs14Bits[twoCharsAs14Bits])
  770. goto LtokenIdentifier;
  771. lookingForHazardousFunction.api = m_str - 1;
  772. lookingForHazardousFunction.apiLength = i + 1;
  773. foundHazardousFunction = REINTERPRET_CAST(HazardousFunction*)(bsearch(&lookingForHazardousFunction, hazardousFunctions, NUMBER_OF(hazardousFunctions), sizeof(hazardousFunctions[0]), (BsearchFunction)CompareHazardousFunction));
  774. if (!foundHazardousFunction)
  775. goto LtokenIdentifier;
  776. m_tokenText = m_str - 1;
  777. m_tokenLength = i + 1;
  778. m_str += i;
  779. m_hazardousFunction = foundHazardousFunction;
  780. return (m_eTokenType = eTokenTypeHazardousFunction);
  781. LtokenIdentifier:
  782. m_tokenText = m_str - 1;
  783. m_tokenLength = i + 1;
  784. m_str += i;
  785. return (m_eTokenType = eTokenTypeIdentifier);
  786. }
  787. }
  788. /*
  789. This has the desired affect of skipping comments.
  790. FUTURE but it doesn't skip preprocessor directives because they
  791. are handled within ScannerGetToken.
  792. This is a bug if your code looks like
  793. CreateFile(GENERIC_READ|
  794. #include "foo.h"
  795. GENERIC_WRITE,
  796. ...
  797. );
  798. returning an int length here is problematic because of \r\n conversion..yuck.
  799. */
  800. const char* CClass::SpanEnd(const char* set) const
  801. {
  802. CClass s(*this);
  803. int ch;
  804. while ((ch = s.GetCharacter())
  805. && strchr(set, ch))
  806. {
  807. /* nothing */
  808. }
  809. return s.m_str;
  810. }
  811. bool CClass::ScanToCharacter(int ch)
  812. {
  813. int ch2;
  814. if (!ch)
  815. {
  816. return false;
  817. }
  818. while ((ch2 = GetCharacter()) && ch2 != ch)
  819. {
  820. /* nothing */
  821. }
  822. return (ch2 == ch);
  823. }
  824. /* This has the desired advantage over strstr of
  825. - skip comments
  826. - not depend on nul termination
  827. */
  828. bool CClass::FindString(const char* str) const
  829. {
  830. CClass s(*this);
  831. int ch;
  832. int ch0 = *str++;
  833. while (s.ScanToCharacter(ch0))
  834. {
  835. const char* str2 = str;
  836. CClass t(s);
  837. while (*str2 && (ch = t.GetCharacter()) && ch == *str2)
  838. {
  839. ++str2;
  840. }
  841. if (!*str2)
  842. return true;
  843. }
  844. return false;
  845. }
  846. unsigned short __stdcall StringLeadingTwoCharsTo14Bits(const char* s)
  847. {
  848. unsigned short result = s[0];
  849. result <<= 7;
  850. result |= result ? s[1] : 0;
  851. return result;
  852. }
  853. void __stdcall InitTables()
  854. {
  855. int i;
  856. for (i = 0 ; i != NUMBER_OF(hazardousFunctions) ; ++i)
  857. {
  858. leadingTwoCharsAs14Bits[StringLeadingTwoCharsTo14Bits(hazardousFunctions[i].api)] = true;
  859. hazardousFunctions[i].apiLength = strlen(hazardousFunctions[i].api);
  860. }
  861. qsort(&hazardousFunctions, i, sizeof(hazardousFunctions[0]), FUNCTION_POINTER_CAST(QsortFunction)(CompareHazardousFunction));
  862. }
  863. const char* CClass::ScanToFirstParameter()
  864. {
  865. // scan to left paren, but if we see right paren or semi first, return null
  866. // FUTURE count parens..
  867. int ch;
  868. while (ch = GetCharacter())
  869. {
  870. switch (ch)
  871. {
  872. default:
  873. break;
  874. case '(':
  875. return m_str;
  876. case ';':
  877. case ')':
  878. return 0;
  879. }
  880. }
  881. return 0;
  882. }
  883. const char* CClass::ScanToLastParameter()
  884. {
  885. const char* ret = 0;
  886. if (ScanToFirstParameter())
  887. {
  888. ret = m_str;
  889. while (ScanToNextParameter())
  890. {
  891. ret = m_str;
  892. }
  893. }
  894. return ret;
  895. }
  896. const char* CClass::ScanToNthParameter(int n)
  897. {
  898. const char* ret = 0;
  899. if (!(ret = ScanToFirstParameter()))
  900. return ret;
  901. while (n-- > 0 && (ret = ScanToNextParameter()))
  902. {
  903. /* nothing */
  904. }
  905. return ret;
  906. }
  907. int CClass::CountParameters() const
  908. {
  909. CClass s(*this);
  910. int result = 0;
  911. if (!s.ScanToFirstParameter())
  912. return result;
  913. ++result;
  914. while (s.ScanToNextParameter())
  915. {
  916. ++result;
  917. }
  918. return result;
  919. }
  920. const char* CClass::ScanToNextParameter()
  921. {
  922. int parenlevel = 1;
  923. while (true)
  924. {
  925. int ch = GetCharacter();
  926. switch (ch)
  927. {
  928. default:
  929. break;
  930. case 0:
  931. printf("end of file scanning for next parameter\n");
  932. /* worst case macro confusion, we go to end of file */
  933. return 0;
  934. case '(':
  935. ++parenlevel;
  936. break;
  937. case ')':
  938. if (--parenlevel == 0)
  939. { /* no next parameter */
  940. return 0;
  941. }
  942. break;
  943. case ',':
  944. if (parenlevel == 1)
  945. {
  946. return m_str;
  947. }
  948. break;
  949. case '#':
  950. /* bad case macro confusion, go to end of statement */
  951. printf("# while scanning for parameters\n");
  952. return 0;
  953. case ';':
  954. /* bad case macro confusion, go to end of statement */
  955. printf("end of statement (;) while scanning for parameters\n");
  956. return 0;
  957. }
  958. }
  959. }
  960. const char* __stdcall CheckRegOpenCommon(CClass& subScanner, int argcRegSam)
  961. {
  962. const char* regsam = subScanner.ScanToNthParameter(argcRegSam);
  963. const char* next = regsam ? subScanner.ScanToNextParameter() : 0;
  964. // allow for it to be last parameter, which it is sometimes
  965. if (!next)
  966. next = subScanner.m_str;
  967. if (!regsam || !next)
  968. {
  969. return szRegOpenNotUnderstood;
  970. }
  971. subScanner.m_str = regsam;
  972. subScanner.m_end = next;
  973. const char* endOfValidSam = subScanner.SpanEnd(UPPER_LETTERS "_|,()0" SPACE);
  974. if (endOfValidSam != next && endOfValidSam != next+1)
  975. {
  976. return szRegOpenNotUnderstood;
  977. }
  978. if (
  979. subScanner.FindString("ALL") // both "all" and "maximum_allowed"
  980. || subScanner.FindString("SET")
  981. || subScanner.FindString("WRITE")
  982. || subScanner.FindString("CREATE")
  983. )
  984. {
  985. return szRegistryWrite;
  986. }
  987. // not a problem, registry only opened for read
  988. return 0;
  989. }
  990. const char* __stdcall CheckSHRegOpen(const CClass& scanner)
  991. {
  992. CClass subScanner(scanner);
  993. return CheckRegOpenCommon(subScanner, 1);
  994. }
  995. const char* __stdcall CheckRegOpenEx(const CClass& scanner)
  996. /*
  997. this function is used for all of RegOpenKeyEx, RegOpenCurrentUser, RegOpenUserClassesRoot,
  998. which is why it uses argc-2 instead of a particular parameter from the start.
  999. */
  1000. {
  1001. CClass subScanner(scanner);
  1002. const int argc = subScanner.CountParameters();
  1003. return CheckRegOpenCommon(subScanner, argc - 2);
  1004. }
  1005. const char* __stdcall CheckCreateObject(const CClass& scanner)
  1006. {
  1007. CClass subScanner(scanner);
  1008. const char* name;
  1009. name = subScanner.ScanToLastParameter();
  1010. if (!name)
  1011. {
  1012. return szCreateObjectNotUnderstood;
  1013. }
  1014. subScanner.m_str = name;
  1015. int ch;
  1016. while (
  1017. (ch = subScanner.GetCharacter())
  1018. && IsSpace(ch)
  1019. )
  1020. {
  1021. }
  1022. name = subScanner.m_str - 1;
  1023. if (!name)
  1024. {
  1025. return szCreateObjectNotUnderstood;
  1026. }
  1027. if (
  1028. strncmp(name, "0", 1) == 0
  1029. || strncmp(name, "NULL", 4) == 0)
  1030. {
  1031. // not a sharing hazard
  1032. return 0;
  1033. }
  1034. return szOpenNamedObject;
  1035. }
  1036. const char* __stdcall CheckCreateFile(const CClass& scanner)
  1037. {
  1038. CClass subScanner(scanner);
  1039. const char* access = subScanner.ScanToNthParameter(1);
  1040. const char* share = access ? subScanner.ScanToNextParameter() : 0;
  1041. const char* endOfValidAccess = 0;
  1042. if (!access || !share)
  1043. {
  1044. return szCreateFileNotUnderstood;
  1045. }
  1046. subScanner.m_str = access;
  1047. subScanner.m_end = share;
  1048. endOfValidAccess = subScanner.SpanEnd(UPPER_LETTERS "_|,()0" SPACE);
  1049. if (endOfValidAccess != share)
  1050. {
  1051. return szCreateFileNotUnderstood;
  1052. }
  1053. /* GENERIC_WRITE WRITE_DAC WRITE_OWNER STANDARD_RIGHTS_WRITE
  1054. STANDARD_RIGHTS_ALL SPECIFIC_RIGHTS_ALL MAXIMUM_ALLOWED GENERIC_ALL
  1055. */
  1056. if (
  1057. subScanner.FindString("WRITE")
  1058. || subScanner.FindString("ALL")
  1059. || subScanner.FindString("0")
  1060. )
  1061. {
  1062. return szFileWrite;
  1063. }
  1064. return 0;
  1065. }
  1066. void CClass::Warn(const char* message) const
  1067. {
  1068. if (message && *message)
  1069. {
  1070. //PrintOpenComment();
  1071. printf("%s(%d): %s\n", m_fullPath, m_line.m_number, message);
  1072. //PrintCloseComment();
  1073. }
  1074. else
  1075. {
  1076. PrintSeperator();
  1077. }
  1078. PrintCode();
  1079. }
  1080. bool CClass::OpenFile(const char* name)
  1081. {
  1082. if (FAILED(m_file.HrCreate(name, GENERIC_READ, FILE_SHARE_READ, OPEN_EXISTING)))
  1083. return false;
  1084. if (FAILED(m_fileMapping.HrCreate(m_file, PAGE_READONLY)))
  1085. return false;
  1086. if (FAILED(m_view.HrCreate(m_fileMapping, FILE_MAP_READ)))
  1087. return false;
  1088. m_str = reinterpret_cast<const char*>(static_cast<const void*>(m_view));
  1089. m_end = m_str + m_file.GetSize();
  1090. m_nextLine.m_start = m_line.m_start = m_str;
  1091. m_nextLine.m_number += 1;
  1092. return true;
  1093. }
  1094. void CClass::RecordStatement(int ch)
  1095. {
  1096. if (ch == ';' || ch == '{' || ch == eTokenTypePreprocessorDirective /*|| ch == '}'*/)
  1097. {
  1098. if (!m_statementStart)
  1099. {
  1100. m_statementStart = m_str;
  1101. }
  1102. else
  1103. {
  1104. CStatement statement = { m_statementStart, m_str};
  1105. m_statements[m_istatement % NUMBER_OF(m_statements)] = statement;
  1106. ++m_istatement;
  1107. m_statementStart = m_str;
  1108. }
  1109. }
  1110. }
  1111. /* do this before iterating over them to print them, this makes the iteration
  1112. interface simple */
  1113. void CClass::OrderStatements() const /* mutable */
  1114. {
  1115. const int N = NUMBER_OF(m_statements);
  1116. CStatement temp[N];
  1117. std::copy(m_statements, m_statements + N, temp);
  1118. for (int i = 0 ; i != N ; ++i)
  1119. {
  1120. m_statements[i] = temp[(m_istatement + i) % N];
  1121. }
  1122. m_istatement = 0;
  1123. }
  1124. void __stdcall PrintOpenComment()
  1125. {
  1126. const int N = 76;
  1127. static char str[N];
  1128. if (!str[0])
  1129. {
  1130. std::fill(str + 1, str + N - 1, '-');
  1131. str[2] = '*';
  1132. str[1] = '/';
  1133. str[0] = '\n';
  1134. }
  1135. fputs(str, stdout);
  1136. }
  1137. void __stdcall PrintCloseComment()
  1138. {
  1139. const int N = 76;
  1140. static char str[N];
  1141. if (!str[0])
  1142. {
  1143. std::fill(str + 1, str + N - 1, '-');
  1144. str[N-3] = '*';
  1145. str[N-2] = '/';
  1146. str[0] = '\n';
  1147. }
  1148. fputs(str, stdout);
  1149. }
  1150. void __stdcall PrintSeperator()
  1151. {
  1152. const int N = 76;
  1153. static char str[N];
  1154. if (!str[0])
  1155. {
  1156. std::fill(str + 1, str + N - 1, '-');
  1157. str[0] = '\n';
  1158. }
  1159. fputs(str, stdout);
  1160. }
  1161. void __stdcall TrimSpaces(const char** begin, const char** end)
  1162. {
  1163. while (*begin != *end && IsSpace(**begin))
  1164. {
  1165. ++*begin;
  1166. }
  1167. while (*begin != *end && IsSpace(*(*end - 1)))
  1168. {
  1169. --*end;
  1170. }
  1171. }
  1172. void __stdcall PrintString(const char* begin, const char* end)
  1173. {
  1174. if (begin && end > begin)
  1175. {
  1176. int length = end - begin;
  1177. printf("%.*s", length, begin);
  1178. }
  1179. }
  1180. const char* __stdcall RemoveLeadingSpace(const char* begin, const char* end)
  1181. {
  1182. if (begin != end && IsSpace(*begin))
  1183. {
  1184. while (begin != end && IsSpace(*begin))
  1185. {
  1186. ++begin;
  1187. }
  1188. }
  1189. return begin;
  1190. }
  1191. const char* __stdcall RemoveLeadingVerticalSpace(const char* begin, const char* end)
  1192. {
  1193. if (begin != end && IsVerticalSpace(*begin))
  1194. {
  1195. while (begin != end && IsVerticalSpace(*begin))
  1196. {
  1197. ++begin;
  1198. }
  1199. }
  1200. return begin;
  1201. }
  1202. const char* __stdcall OneLeadingVerticalSpace(const char* begin, const char* end)
  1203. {
  1204. if (begin != end && IsVerticalSpace(*begin))
  1205. {
  1206. while (begin != end && IsVerticalSpace(*begin))
  1207. {
  1208. ++begin;
  1209. }
  1210. --begin;
  1211. }
  1212. return begin;
  1213. }
  1214. const char* __stdcall RemoveTrailingSpace(const char* begin, const char* end)
  1215. {
  1216. if (begin != end && IsSpace(*(end-1)))
  1217. {
  1218. while (begin != end && IsSpace(*(end-1)))
  1219. {
  1220. --end;
  1221. }
  1222. }
  1223. return end;
  1224. }
  1225. const char* __stdcall RemoveTrailingVerticalSpace(const char* begin, const char* end)
  1226. {
  1227. if (begin != end && IsVerticalSpace(*(end-1)))
  1228. {
  1229. while (begin != end && IsVerticalSpace(*(end-1)))
  1230. {
  1231. --end;
  1232. }
  1233. }
  1234. return end;
  1235. }
  1236. const char* __stdcall OneTrailingVerticalSpace(const char* begin, const char* end)
  1237. {
  1238. if (begin != end && IsVerticalSpace(*(end-1)))
  1239. {
  1240. while (begin != end && IsVerticalSpace(*(end-1)))
  1241. {
  1242. --end;
  1243. }
  1244. ++end;
  1245. }
  1246. return end;
  1247. }
  1248. void CClass::PrintCode() const
  1249. {
  1250. // this function is messy wrt when newlines are printed
  1251. //PrintSeperator();
  1252. OrderStatements();
  1253. int i;
  1254. if (g_nPrintContextStatements)
  1255. {
  1256. const char* previousStatementsEnd = 0;
  1257. for (i = NUMBER_OF(m_statements) - g_nPrintContextStatements ; i != NUMBER_OF(m_statements) ; i++)
  1258. {
  1259. if (m_statements[i].begin && m_statements[i].end)
  1260. {
  1261. previousStatementsEnd = m_statements[i].end;
  1262. // for the first iteration, limit ourselves to one newline
  1263. if (i == NUMBER_OF(m_statements) - g_nPrintContextStatements)
  1264. {
  1265. m_statements[i].begin = RemoveLeadingVerticalSpace(m_statements[i].begin, m_statements[i].end);
  1266. }
  1267. PrintString(m_statements[i].begin, m_statements[i].end);
  1268. }
  1269. }
  1270. if (previousStatementsEnd)
  1271. {
  1272. PrintString(previousStatementsEnd, m_line.m_start);
  1273. }
  1274. }
  1275. const char* newlineChar = SequenceLinearFindValue(m_line.m_start, m_end, '\n');
  1276. const char* returnChar = SequenceLinearFindValue(m_line.m_start, m_end, '\r');
  1277. const char* endOfLine = std::min(newlineChar, returnChar);
  1278. int outputLineOffset = 0;
  1279. int lineLength = endOfLine - m_line.m_start;
  1280. if (g_fPrintLine)
  1281. {
  1282. printf("%.*s\n", lineLength, m_line.m_start);
  1283. }
  1284. // underline the offending hazardous function with carets
  1285. if (g_nPrintContextStatements)
  1286. {
  1287. // skip the part of the line preceding the hazardous functon,
  1288. // print tabs where it has tabs
  1289. for (i = 0 ; i < m_str - m_line.m_start - m_hazardousFunction->apiLength ; ++i)
  1290. {
  1291. fputs((m_line.m_start[i] != '\t') ? " " : "\t"/*" "*/, stdout);
  1292. }
  1293. // underline the function with carets
  1294. for (i = 0 ; i < m_hazardousFunction->apiLength ; ++i)
  1295. putchar('^');
  1296. putchar('\n');
  1297. }
  1298. // find the approximate end of statement
  1299. const char* statementSemi = SequenceLinearFindValue(m_line.m_start, m_end, ';');
  1300. const char* statementBrace = SequenceLinearFindValue(m_line.m_start, m_end, '{'); // }
  1301. const char* statementPound = SequenceLinearFindValue(m_line.m_start, m_end, '#');
  1302. // statements don't really end in a pound, but this helps terminate output
  1303. // in some cases
  1304. const char* statementEnd = RemoveTrailingSpace(m_line.m_start, std::min(std::min(statementSemi, statementBrace), statementPound));
  1305. if (g_fPrintFullStatement)
  1306. {
  1307. if (statementEnd > endOfLine)
  1308. {
  1309. const char* statementBegin = RemoveLeadingVerticalSpace(endOfLine, statementEnd);
  1310. if (*statementEnd == ';')
  1311. {
  1312. ++statementEnd;
  1313. }
  1314. PrintString(statementBegin, statementEnd);
  1315. if (!g_nPrintContextStatements)
  1316. {
  1317. putchar('\n');
  1318. }
  1319. }
  1320. else
  1321. {
  1322. if (*statementEnd == ';')
  1323. {
  1324. ++statementEnd;
  1325. }
  1326. }
  1327. }
  1328. // print more statements after it
  1329. if (g_nPrintContextStatements)
  1330. {
  1331. for (i = 0 ; i != g_nPrintContextStatements ; ++i)
  1332. {
  1333. // and then a few more
  1334. const char* statement2 = SequenceLinearFindValue(statementEnd, m_end, ';');
  1335. if (i == 0)
  1336. {
  1337. statementEnd = RemoveLeadingVerticalSpace(statementEnd, statement2);
  1338. }
  1339. if (i == g_nPrintContextStatements-1)
  1340. {
  1341. statement2 = RemoveTrailingSpace(statementEnd, statement2);
  1342. PrintString(statementEnd, statement2);
  1343. putchar(';');
  1344. putchar('\n');
  1345. }
  1346. else
  1347. {
  1348. PrintString(statementEnd, statement2);
  1349. putchar(';');
  1350. }
  1351. statementEnd = statement2 + (statement2 != m_end);
  1352. }
  1353. }
  1354. }
  1355. int CSharingHazardCheck::ProcessFile(const std::string& name)
  1356. {
  1357. // test argv processing
  1358. // std::cout << name << std::endl;
  1359. // return;
  1360. int total = 0;
  1361. CClass scanner;
  1362. ETokenType m_eTokenType = INT_TO_ENUM_CAST(ETokenType)(0);
  1363. scanner.m_fullPath[0] = 0;
  1364. if (!GetFullPathName(name.c_str(), NUMBER_OF(scanner.m_fullPath), scanner.m_fullPath, NULL))
  1365. strcpy(scanner.m_fullPath, name.c_str());
  1366. if (!scanner.OpenFile(scanner.m_fullPath))
  1367. return total;
  1368. scanner.RecordStatement(';');
  1369. // we "parse" token :: token, to avoid these false positives
  1370. int idColonColonState = 0;
  1371. while (m_eTokenType = scanner.GetToken())
  1372. {
  1373. scanner.RecordStatement(m_eTokenType);
  1374. switch (m_eTokenType)
  1375. {
  1376. default:
  1377. idColonColonState = 0;
  1378. break;
  1379. case eTokenTypeIdentifier:
  1380. idColonColonState = 1;
  1381. break;
  1382. case ':':
  1383. switch (idColonColonState)
  1384. {
  1385. case 1:
  1386. idColonColonState = 2;
  1387. break;
  1388. case 2:
  1389. // skip a token
  1390. // idColonColonState = 3;
  1391. scanner.GetToken();
  1392. // idColonColonState = 0;
  1393. // break;
  1394. case 0:
  1395. //case 3:
  1396. idColonColonState = 0;
  1397. break;
  1398. }
  1399. break;
  1400. case '>': // second bogus token in ->
  1401. case '.':
  1402. // skip a token to avoid foo->OpenFile, foo.OpenFile
  1403. scanner.GetToken();
  1404. break;
  1405. case eTokenTypeHazardousFunction:
  1406. {
  1407. if (scanner.m_hazardousFunction->function)
  1408. {
  1409. const char* message = scanner.m_hazardousFunction->function(scanner);
  1410. if (message)
  1411. {
  1412. total += 1;
  1413. scanner.Warn(message);
  1414. }
  1415. }
  1416. else if (scanner.m_hazardousFunction->message)
  1417. {
  1418. total += 1;
  1419. scanner.Warn(scanner.m_hazardousFunction->message);
  1420. }
  1421. else
  1422. {
  1423. scanner.Warn();
  1424. BreakPoint();
  1425. }
  1426. }
  1427. break;
  1428. }
  1429. }
  1430. return total;
  1431. }
  1432. bool __stdcall Contains(const char* s, const char* set)
  1433. {
  1434. return s && *s && strcspn(s, set) != strlen(s);
  1435. }
  1436. bool ContainsSlashes(const char* s) { return Contains(s, "\\/"); }
  1437. bool ContainsSlash(const char* s) { return ContainsSlashes(s); }
  1438. bool ContainsWildcards(const char* s) { return Contains(s, "*?"); }
  1439. bool IsSlash(int ch) { return (ch == '\\' || ch == '/'); }
  1440. std::string PathAppend(const std::string& s, const std::string& t)
  1441. {
  1442. // why does string lack back()?
  1443. int sslash = IsSlash(*(s.end() - 1)) ? 2 : 0;
  1444. int tslash = IsSlash(*t.begin()) ? 1 : 0;
  1445. switch (sslash | tslash)
  1446. {
  1447. case 0:
  1448. return (s + '\\' + t);
  1449. case 1:
  1450. case 2:
  1451. return (s + t);
  1452. case 3:
  1453. return (s + t.substr(1));
  1454. }
  1455. return std::string();
  1456. }
  1457. void __stdcall PathSplitOffLast(const std::string& s, std::string* a, std::string* b)
  1458. {
  1459. std::string::size_type slash = s.find_last_of("\\/");
  1460. *a = s.substr(0, slash);
  1461. *b = s.substr(slash + 1);
  1462. }
  1463. std::string __stdcall PathRemoveLastElement(const std::string& s)
  1464. {
  1465. return s.substr(0, s.find_last_of("\\/"));
  1466. }
  1467. bool __stdcall IsDotOrDotDot(const char* s)
  1468. {
  1469. return s[0] == '.' && (s[1] == 0 || (s[1] == '.' && s[2] == 0));
  1470. }
  1471. void CSharingHazardCheck::ProcessArgs(int argc, char** argv, std::vector<std::string>& files)
  1472. {
  1473. int i;
  1474. char fullpath[1U<<16]; fullpath[0] = 0;
  1475. char currentDirectory[1U << 16]; currentDirectory[0] = 0;
  1476. bool fRecurse = false;
  1477. std::vector<std::string> directories;
  1478. std::vector<std::string> genericWildcards;
  1479. std::vector<std::string> particularWildcards;
  1480. bool fWarnEmptyWildcards = true;
  1481. currentDirectory[0] = 0;
  1482. GetCurrentDirectory(NUMBER_OF(currentDirectory), currentDirectory);
  1483. for (i = 1 ; i < argc ; ++i)
  1484. {
  1485. switch (argv[i][0])
  1486. {
  1487. default:
  1488. if (ContainsWildcards(argv[i]))
  1489. {
  1490. if (ContainsSlash(argv[i]))
  1491. {
  1492. // these will only be applied once, in whatever
  1493. // path they specifically refer
  1494. if (GetFullPathName(argv[i], NUMBER_OF(fullpath), fullpath, NULL))
  1495. {
  1496. particularWildcards.push_back(fullpath);
  1497. }
  1498. else
  1499. {
  1500. printf("GetFullPathName failed %s\n", argv[i]);
  1501. }
  1502. }
  1503. else
  1504. {
  1505. // do NOT call GetFullPathName here
  1506. genericWildcards.push_back(argv[i]);
  1507. }
  1508. }
  1509. else
  1510. {
  1511. if (GetFullPathName(argv[i], NUMBER_OF(fullpath), fullpath, NULL))
  1512. {
  1513. DWORD dwFileAttributes = GetFileAttributes(fullpath);
  1514. if (dwFileAttributes != 0xFFFFFFFF)
  1515. {
  1516. if (dwFileAttributes & FILE_ATTRIBUTE_DIRECTORY)
  1517. {
  1518. directories.push_back(fullpath);
  1519. }
  1520. else
  1521. {
  1522. files.push_back(fullpath);
  1523. }
  1524. }
  1525. else
  1526. {
  1527. printf("%s nonexistant\n", fullpath);
  1528. }
  1529. }
  1530. else
  1531. printf("GetFullPathName failed %s\n", argv[i]);
  1532. }
  1533. break;
  1534. /*
  1535. default output
  1536. file(line):reason
  1537. -recurse
  1538. -print-line
  1539. prints line of code with offending function after file(line):reason
  1540. -print-statement
  1541. print statement containing offending function after file(line):reason
  1542. supersedes -print-line
  1543. -print-context-lines:n
  1544. -print-statement plus surrounding n lines (not implemented)
  1545. -print-context-statements:n
  1546. -print-statement plus surrounding n "statements" (count semis and braces)
  1547. file names apply across all directories recursed into
  1548. wild cards apply across all directories recursed into
  1549. naming a directory implies one level recursion (unless -recurse is also seen)
  1550. environment variable SHARING_HAZARD_CHECK_OPTIONS added to argv (not implemented)
  1551. all directory walking happens before any output is generated
  1552. */
  1553. case '-':
  1554. case '/':
  1555. argv[i] += 1;
  1556. static const char szRecurse[] = "recurse";
  1557. static const char szPrintStatement[] = "print-statement";
  1558. static const char szPrintLine[] = "print-line";
  1559. static const char szPrintContextLines[] = "print-context-lines";
  1560. static const char szPrintContextStatements[] = "print-context-statements";
  1561. switch (argv[i][0])
  1562. {
  1563. default:
  1564. printf("unknown switch %s\n", argv[i]);
  1565. break;
  1566. case 'r': case 'R':
  1567. if (0 == _stricmp(argv[i]+1, 1 + szRecurse))
  1568. {
  1569. fRecurse = true;
  1570. }
  1571. break;
  1572. case 'p': case 'P':
  1573. if (0 == _strnicmp(argv[i]+1, "rint-", 5))
  1574. {
  1575. if (0 == _stricmp(
  1576. 6 + argv[i],
  1577. 6 + szPrintLine
  1578. ))
  1579. {
  1580. g_fPrintLine = true;
  1581. }
  1582. else if (0 == _stricmp(
  1583. 6 + argv[i],
  1584. 6 + szPrintStatement
  1585. ))
  1586. {
  1587. g_fPrintFullStatement = true;
  1588. g_fPrintLine = true;
  1589. }
  1590. else if (0 == _strnicmp(
  1591. 6 + argv[i],
  1592. 6 + szPrintContextLines,
  1593. NUMBER_OF(szPrintContextLines) - 6
  1594. ))
  1595. {
  1596. printf("unimplemented switch %s\n", argv[i]);
  1597. }
  1598. else if (0 == _strnicmp(
  1599. 6 + argv[i],
  1600. 6 + szPrintContextStatements,
  1601. NUMBER_OF(szPrintContextLines) - 6))
  1602. {
  1603. if (argv[i][NUMBER_OF(szPrintContextStatements)-1] == ':')
  1604. {
  1605. g_nPrintContextStatements = atoi(argv[i] + NUMBER_OF(szPrintContextStatements));
  1606. g_nPrintContextStatements = std::min<int>(g_nPrintContextStatements, NUMBER_OF(CClass().m_statements));
  1607. g_nPrintContextStatements = std::max<int>(g_nPrintContextStatements, 1);
  1608. }
  1609. else
  1610. {
  1611. g_nPrintContextStatements = 2;
  1612. }
  1613. g_fPrintFullStatement = true;
  1614. g_fPrintLine = true;
  1615. }
  1616. }
  1617. break;
  1618. }
  1619. break;
  1620. }
  1621. }
  1622. if (fRecurse)
  1623. {
  1624. // split up particular wildcards into directories and generic wildcards
  1625. for (std::vector<std::string>::const_iterator i = particularWildcards.begin();
  1626. i != particularWildcards.end();
  1627. ++i
  1628. )
  1629. {
  1630. std::string path;
  1631. std::string wild;
  1632. PathSplitOffLast(*i, &path, &wild);
  1633. directories.push_back(path);
  1634. genericWildcards.push_back(wild);
  1635. //printf("%s%s -> %s %s\n", path.c_str(), wild.c_str(), path.c_str(), wild.c_str());
  1636. }
  1637. particularWildcards.clear();
  1638. }
  1639. // empty command line produces nothing, by design
  1640. if (genericWildcards.empty()
  1641. && !directories.empty()
  1642. )
  1643. {
  1644. genericWildcards.push_back("*");
  1645. }
  1646. else if (
  1647. directories.empty()
  1648. && files.empty()
  1649. && !genericWildcards.empty())
  1650. {
  1651. directories.push_back(currentDirectory);
  1652. }
  1653. if (!directories.empty()
  1654. || !genericWildcards.empty()
  1655. || !particularWildcards.empty()
  1656. || fRecurse
  1657. )
  1658. {
  1659. // if you don't output the \n and let the .s word wrap,
  1660. // f4 in the output gets messed up wrt which line gets highlighted
  1661. printf("processing argv..\n"); fflush(stdout);
  1662. #define ARGV_PROGRESS() printf("."); fflush(stdout);
  1663. #undef ARGV_PROGRESS
  1664. #define ARGV_PROGRESS() printf("processing argv..\n"); fflush(stdout);
  1665. #undef ARGV_PROGRESS
  1666. #define ARGV_PROGRESS() /* nothing */
  1667. }
  1668. WIN32_FIND_DATA findData;
  1669. if (!directories.empty())
  1670. {
  1671. std::set<std::string> allDirectoriesSeen; // avoid repeats when recursing
  1672. std::stack<std::string> stack;
  1673. for (std::vector<std::string>::const_iterator i = directories.begin();
  1674. i != directories.end();
  1675. ++i
  1676. )
  1677. {
  1678. stack.push(*i);
  1679. }
  1680. while (!stack.empty())
  1681. {
  1682. std::string directory = stack.top();
  1683. stack.pop();
  1684. if (!fRecurse || allDirectoriesSeen.find(directory) == allDirectoriesSeen.end())
  1685. {
  1686. if (fRecurse)
  1687. {
  1688. allDirectoriesSeen.insert(allDirectoriesSeen.end(), directory);
  1689. }
  1690. for
  1691. (
  1692. std::vector<std::string>::const_iterator w = genericWildcards.begin();
  1693. w != genericWildcards.end();
  1694. ++w
  1695. )
  1696. {
  1697. std::string file = PathAppend(directory, *w);
  1698. CFindFile findFile;
  1699. if (SUCCEEDED(findFile.HrCreate(file.c_str(), &findData)))
  1700. {
  1701. fWarnEmptyWildcards = false;
  1702. ARGV_PROGRESS();
  1703. // only match files here
  1704. do
  1705. {
  1706. if ((findData.dwFileAttributes & FILE_ATTRIBUTE_DIRECTORY) == 0)
  1707. {
  1708. files.push_back(PathAppend(directory, findData.cFileName));
  1709. }
  1710. } while (FindNextFile(findFile, &findData));
  1711. }
  1712. else
  1713. {
  1714. if (fWarnEmptyWildcards)
  1715. printf("warning: %s expanded to nothing\n", file.c_str());
  1716. }
  1717. if (fRecurse)
  1718. {
  1719. // only match directories here
  1720. std::string star = PathAppend(directory, "*");
  1721. CFindFile findFile;
  1722. if (SUCCEEDED(findFile.HrCreate(star.c_str(), &findData)))
  1723. {
  1724. fWarnEmptyWildcards = false;
  1725. ARGV_PROGRESS();
  1726. do
  1727. {
  1728. if (!IsDotOrDotDot(findData.cFileName)
  1729. && (findData.dwFileAttributes & FILE_ATTRIBUTE_DIRECTORY))
  1730. {
  1731. stack.push(PathAppend(directory, findData.cFileName));
  1732. }
  1733. } while (FindNextFile(findFile, &findData));
  1734. }
  1735. else
  1736. {
  1737. if (fWarnEmptyWildcards)
  1738. printf("warning: %s expanded to nothing\n", star.c_str());
  1739. }
  1740. }
  1741. }
  1742. }
  1743. }
  1744. }
  1745. // particular wildcards only match files, not directories
  1746. for
  1747. (
  1748. std::vector<std::string>::const_iterator w = particularWildcards.begin();
  1749. w != particularWildcards.end();
  1750. ++w
  1751. )
  1752. {
  1753. std::string directory = PathRemoveLastElement(*w);
  1754. CFindFile findFile;
  1755. if (SUCCEEDED(findFile.HrCreate(w->c_str(), &findData)))
  1756. {
  1757. fWarnEmptyWildcards = false;
  1758. ARGV_PROGRESS();
  1759. // only match files here
  1760. do
  1761. {
  1762. if ((findData.dwFileAttributes & FILE_ATTRIBUTE_DIRECTORY) == 0)
  1763. {
  1764. files.push_back(PathAppend(directory, findData.cFileName));
  1765. }
  1766. } while (FindNextFile(findFile, &findData));
  1767. }
  1768. else
  1769. {
  1770. // if (fWarnEmptyWildcards) // always warn for "particular wildcards"
  1771. printf("warning: %s expanded to nothing\n", w->c_str());
  1772. }
  1773. }
  1774. std::sort(files.begin(), files.end());
  1775. files.resize(std::unique(files.begin(), files.end()) - files.begin());
  1776. printf("\n");
  1777. }
  1778. void CSharingHazardCheck::Main(int argc, char** argv)
  1779. {
  1780. if (argc < 2)
  1781. {
  1782. printf(usage, argv[0]);
  1783. exit(EXIT_FAILURE);
  1784. }
  1785. printf(banner);
  1786. std::vector<std::string> files;
  1787. ProcessArgs(argc, argv, files);
  1788. InitTables();
  1789. int total = 0;
  1790. for (
  1791. std::vector<std::string>::const_iterator i = files.begin();
  1792. i != files.end();
  1793. ++i
  1794. )
  1795. {
  1796. total += ProcessFile(*i);
  1797. }
  1798. printf("\n%d warnings\n", total);
  1799. }
  1800. int __cdecl main(int argc, char** argv)
  1801. {
  1802. app.Main(argc, argv);
  1803. return 0;
  1804. }