xmlrole.c 33 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401
  1. /*
  2. Copyright (c) 1998, 1999 Thai Open Source Software Center Ltd
  3. See the file COPYING for copying permission.
  4. */
  /* Revision-control identification string kept from the original source. */
  static char RCSId[]
    = "$Header$";

  /*
   * Return the RCS identification string of this translation unit.
   *
   * The accessor exists so that RCSId is referenced, which avoids a warning
   * about an unused static without removing RCSId from the original.
   * The parameter list is spelled (void) so that the definition is a real
   * prototype rather than an old-style declarator accepting any arguments.
   */
  const char* cm_expat_GetXMLRole_RCSId(void)
  {
    return RCSId;
  }
  12. #include <cmexpat/expatConfig.h>
  13. #include "xmlrole.h"
  14. #include "ascii.h"
  /* Doesn't check:
     - that ',' and '|' are not mixed in a model group
     - the content of literals
  */
  19. static const char KW_ANY[] = { ASCII_A, ASCII_N, ASCII_Y, '\0' };
  20. static const char KW_ATTLIST[] = { ASCII_A, ASCII_T, ASCII_T, ASCII_L, ASCII_I, ASCII_S, ASCII_T, '\0' };
  21. static const char KW_CDATA[] = { ASCII_C, ASCII_D, ASCII_A, ASCII_T, ASCII_A, '\0' };
  22. static const char KW_DOCTYPE[] = { ASCII_D, ASCII_O, ASCII_C, ASCII_T, ASCII_Y, ASCII_P, ASCII_E, '\0' };
  23. static const char KW_ELEMENT[] = { ASCII_E, ASCII_L, ASCII_E, ASCII_M, ASCII_E, ASCII_N, ASCII_T, '\0' };
  24. static const char KW_EMPTY[] = { ASCII_E, ASCII_M, ASCII_P, ASCII_T, ASCII_Y, '\0' };
  25. static const char KW_ENTITIES[] = { ASCII_E, ASCII_N, ASCII_T, ASCII_I, ASCII_T, ASCII_I, ASCII_E, ASCII_S, '\0' };
  26. static const char KW_ENTITY[] = { ASCII_E, ASCII_N, ASCII_T, ASCII_I, ASCII_T, ASCII_Y, '\0' };
  27. static const char KW_FIXED[] = { ASCII_F, ASCII_I, ASCII_X, ASCII_E, ASCII_D, '\0' };
  28. static const char KW_ID[] = { ASCII_I, ASCII_D, '\0' };
  29. static const char KW_IDREF[] = { ASCII_I, ASCII_D, ASCII_R, ASCII_E, ASCII_F, '\0' };
  30. static const char KW_IDREFS[] = { ASCII_I, ASCII_D, ASCII_R, ASCII_E, ASCII_F, ASCII_S, '\0' };
  31. static const char KW_IGNORE[] = { ASCII_I, ASCII_G, ASCII_N, ASCII_O, ASCII_R, ASCII_E, '\0' };
  32. static const char KW_IMPLIED[] = { ASCII_I, ASCII_M, ASCII_P, ASCII_L, ASCII_I, ASCII_E, ASCII_D, '\0' };
  33. static const char KW_INCLUDE[] = { ASCII_I, ASCII_N, ASCII_C, ASCII_L, ASCII_U, ASCII_D, ASCII_E, '\0' };
  34. static const char KW_NDATA[] = { ASCII_N, ASCII_D, ASCII_A, ASCII_T, ASCII_A, '\0' };
  35. static const char KW_NMTOKEN[] = { ASCII_N, ASCII_M, ASCII_T, ASCII_O, ASCII_K, ASCII_E, ASCII_N, '\0' };
  36. static const char KW_NMTOKENS[] = { ASCII_N, ASCII_M, ASCII_T, ASCII_O, ASCII_K, ASCII_E, ASCII_N, ASCII_S, '\0' };
  37. static const char KW_NOTATION[] = { ASCII_N, ASCII_O, ASCII_T, ASCII_A, ASCII_T, ASCII_I, ASCII_O, ASCII_N, '\0' };
  38. static const char KW_PCDATA[] = { ASCII_P, ASCII_C, ASCII_D, ASCII_A, ASCII_T, ASCII_A, '\0' };
  39. static const char KW_PUBLIC[] = { ASCII_P, ASCII_U, ASCII_B, ASCII_L, ASCII_I, ASCII_C, '\0' };
  40. static const char KW_REQUIRED[] = { ASCII_R, ASCII_E, ASCII_Q, ASCII_U, ASCII_I, ASCII_R, ASCII_E, ASCII_D, '\0' };
  41. static const char KW_SYSTEM[] = { ASCII_S, ASCII_Y, ASCII_S, ASCII_T, ASCII_E, ASCII_M, '\0' };
  /*
   * Width in bytes of the smallest character of an encoding.  A definition
   * supplied before this point takes precedence; otherwise the value is read
   * from the encoding's minBytesPerChar member.
   */
  #if !defined(MIN_BYTES_PER_CHAR)
  #  define MIN_BYTES_PER_CHAR(enc) ((enc)->minBytesPerChar)
  #endif
  /*
   * setTopLevel(state): install the handler used once a declaration has been
   * completed.  With XML_DTD the choice depends on state->documentEntity
   * (internalSubset when set, externalSubset1 otherwise); without XML_DTD it
   * is always internalSubset.  The macro yields the assigned handler.
   */
  #if defined(XML_DTD)
  #  define TOP_LEVEL_HANDLER(state) \
       ((state)->documentEntity ? internalSubset : externalSubset1)
  #else /* not XML_DTD */
  #  define TOP_LEVEL_HANDLER(state) internalSubset
  #endif /* not XML_DTD */
  #define setTopLevel(state) ((state)->handler = TOP_LEVEL_HANDLER(state))
  53. typedef int PROLOG_HANDLER(PROLOG_STATE *state,
  54. int tok,
  55. const char *ptr,
  56. const char *end,
  57. const ENCODING *enc);
  58. static PROLOG_HANDLER
  59. prolog0, prolog1, prolog2,
  60. doctype0, doctype1, doctype2, doctype3, doctype4, doctype5,
  61. internalSubset,
  62. entity0, entity1, entity2, entity3, entity4, entity5, entity6,
  63. entity7, entity8, entity9,
  64. notation0, notation1, notation2, notation3, notation4,
  65. attlist0, attlist1, attlist2, attlist3, attlist4, attlist5, attlist6,
  66. attlist7, attlist8, attlist9,
  67. element0, element1, element2, element3, element4, element5, element6,
  68. element7,
  69. #ifdef XML_DTD
  70. externalSubset0, externalSubset1,
  71. condSect0, condSect1, condSect2,
  72. #endif /* XML_DTD */
  73. declClose,
  74. error;
  75. static
  76. int common(PROLOG_STATE *state, int tok);
  77. static
  78. int prolog0(PROLOG_STATE *state,
  79. int tok,
  80. const char *ptr,
  81. const char *end,
  82. const ENCODING *enc)
  83. {
  84. switch (tok) {
  85. case XML_TOK_PROLOG_S:
  86. state->handler = prolog1;
  87. return XML_ROLE_NONE;
  88. case XML_TOK_XML_DECL:
  89. state->handler = prolog1;
  90. return XML_ROLE_XML_DECL;
  91. case XML_TOK_PI:
  92. state->handler = prolog1;
  93. return XML_ROLE_NONE;
  94. case XML_TOK_COMMENT:
  95. state->handler = prolog1;
  96. case XML_TOK_BOM:
  97. return XML_ROLE_NONE;
  98. case XML_TOK_DECL_OPEN:
  99. if (!XmlNameMatchesAscii(enc,
  100. ptr + 2 * MIN_BYTES_PER_CHAR(enc),
  101. end,
  102. KW_DOCTYPE))
  103. break;
  104. state->handler = doctype0;
  105. return XML_ROLE_NONE;
  106. case XML_TOK_INSTANCE_START:
  107. state->handler = error;
  108. return XML_ROLE_INSTANCE_START;
  109. }
  110. return common(state, tok);
  111. }
  112. static
  113. int prolog1(PROLOG_STATE *state,
  114. int tok,
  115. const char *ptr,
  116. const char *end,
  117. const ENCODING *enc)
  118. {
  119. switch (tok) {
  120. case XML_TOK_PROLOG_S:
  121. return XML_ROLE_NONE;
  122. case XML_TOK_PI:
  123. case XML_TOK_COMMENT:
  124. case XML_TOK_BOM:
  125. return XML_ROLE_NONE;
  126. case XML_TOK_DECL_OPEN:
  127. if (!XmlNameMatchesAscii(enc,
  128. ptr + 2 * MIN_BYTES_PER_CHAR(enc),
  129. end,
  130. KW_DOCTYPE))
  131. break;
  132. state->handler = doctype0;
  133. return XML_ROLE_NONE;
  134. case XML_TOK_INSTANCE_START:
  135. state->handler = error;
  136. return XML_ROLE_INSTANCE_START;
  137. }
  138. return common(state, tok);
  139. }
  140. static
  141. int prolog2(PROLOG_STATE *state,
  142. int tok,
  143. const char *ptr,
  144. const char *end,
  145. const ENCODING *enc)
  146. {
  147. cmExpatUnused(ptr);
  148. cmExpatUnused(end);
  149. cmExpatUnused(enc);
  150. switch (tok) {
  151. case XML_TOK_PROLOG_S:
  152. return XML_ROLE_NONE;
  153. case XML_TOK_PI:
  154. case XML_TOK_COMMENT:
  155. return XML_ROLE_NONE;
  156. case XML_TOK_INSTANCE_START:
  157. state->handler = error;
  158. return XML_ROLE_INSTANCE_START;
  159. }
  160. return common(state, tok);
  161. }
  162. static
  163. int doctype0(PROLOG_STATE *state,
  164. int tok,
  165. const char *ptr,
  166. const char *end,
  167. const ENCODING *enc)
  168. {
  169. cmExpatUnused(ptr);
  170. cmExpatUnused(end);
  171. cmExpatUnused(enc);
  172. switch (tok) {
  173. case XML_TOK_PROLOG_S:
  174. return XML_ROLE_NONE;
  175. case XML_TOK_NAME:
  176. case XML_TOK_PREFIXED_NAME:
  177. state->handler = doctype1;
  178. return XML_ROLE_DOCTYPE_NAME;
  179. }
  180. return common(state, tok);
  181. }
  182. static
  183. int doctype1(PROLOG_STATE *state,
  184. int tok,
  185. const char *ptr,
  186. const char *end,
  187. const ENCODING *enc)
  188. {
  189. switch (tok) {
  190. case XML_TOK_PROLOG_S:
  191. return XML_ROLE_NONE;
  192. case XML_TOK_OPEN_BRACKET:
  193. state->handler = internalSubset;
  194. return XML_ROLE_DOCTYPE_INTERNAL_SUBSET;
  195. case XML_TOK_DECL_CLOSE:
  196. state->handler = prolog2;
  197. return XML_ROLE_DOCTYPE_CLOSE;
  198. case XML_TOK_NAME:
  199. if (XmlNameMatchesAscii(enc, ptr, end, KW_SYSTEM)) {
  200. state->handler = doctype3;
  201. return XML_ROLE_NONE;
  202. }
  203. if (XmlNameMatchesAscii(enc, ptr, end, KW_PUBLIC)) {
  204. state->handler = doctype2;
  205. return XML_ROLE_NONE;
  206. }
  207. break;
  208. }
  209. return common(state, tok);
  210. }
  211. static
  212. int doctype2(PROLOG_STATE *state,
  213. int tok,
  214. const char *ptr,
  215. const char *end,
  216. const ENCODING *enc)
  217. {
  218. cmExpatUnused(ptr);
  219. cmExpatUnused(end);
  220. cmExpatUnused(enc);
  221. switch (tok) {
  222. case XML_TOK_PROLOG_S:
  223. return XML_ROLE_NONE;
  224. case XML_TOK_LITERAL:
  225. state->handler = doctype3;
  226. return XML_ROLE_DOCTYPE_PUBLIC_ID;
  227. }
  228. return common(state, tok);
  229. }
  230. static
  231. int doctype3(PROLOG_STATE *state,
  232. int tok,
  233. const char *ptr,
  234. const char *end,
  235. const ENCODING *enc)
  236. {
  237. cmExpatUnused(ptr);
  238. cmExpatUnused(end);
  239. cmExpatUnused(enc);
  240. switch (tok) {
  241. case XML_TOK_PROLOG_S:
  242. return XML_ROLE_NONE;
  243. case XML_TOK_LITERAL:
  244. state->handler = doctype4;
  245. return XML_ROLE_DOCTYPE_SYSTEM_ID;
  246. }
  247. return common(state, tok);
  248. }
  249. static
  250. int doctype4(PROLOG_STATE *state,
  251. int tok,
  252. const char *ptr,
  253. const char *end,
  254. const ENCODING *enc)
  255. {
  256. cmExpatUnused(ptr);
  257. cmExpatUnused(end);
  258. cmExpatUnused(enc);
  259. switch (tok) {
  260. case XML_TOK_PROLOG_S:
  261. return XML_ROLE_NONE;
  262. case XML_TOK_OPEN_BRACKET:
  263. state->handler = internalSubset;
  264. return XML_ROLE_DOCTYPE_INTERNAL_SUBSET;
  265. case XML_TOK_DECL_CLOSE:
  266. state->handler = prolog2;
  267. return XML_ROLE_DOCTYPE_CLOSE;
  268. }
  269. return common(state, tok);
  270. }
  271. static
  272. int doctype5(PROLOG_STATE *state,
  273. int tok,
  274. const char *ptr,
  275. const char *end,
  276. const ENCODING *enc)
  277. {
  278. cmExpatUnused(ptr);
  279. cmExpatUnused(end);
  280. cmExpatUnused(enc);
  281. switch (tok) {
  282. case XML_TOK_PROLOG_S:
  283. return XML_ROLE_NONE;
  284. case XML_TOK_DECL_CLOSE:
  285. state->handler = prolog2;
  286. return XML_ROLE_DOCTYPE_CLOSE;
  287. }
  288. return common(state, tok);
  289. }
  290. static
  291. int internalSubset(PROLOG_STATE *state,
  292. int tok,
  293. const char *ptr,
  294. const char *end,
  295. const ENCODING *enc)
  296. {
  297. switch (tok) {
  298. case XML_TOK_PROLOG_S:
  299. return XML_ROLE_NONE;
  300. case XML_TOK_DECL_OPEN:
  301. if (XmlNameMatchesAscii(enc,
  302. ptr + 2 * MIN_BYTES_PER_CHAR(enc),
  303. end,
  304. KW_ENTITY)) {
  305. state->handler = entity0;
  306. return XML_ROLE_NONE;
  307. }
  308. if (XmlNameMatchesAscii(enc,
  309. ptr + 2 * MIN_BYTES_PER_CHAR(enc),
  310. end,
  311. KW_ATTLIST)) {
  312. state->handler = attlist0;
  313. return XML_ROLE_NONE;
  314. }
  315. if (XmlNameMatchesAscii(enc,
  316. ptr + 2 * MIN_BYTES_PER_CHAR(enc),
  317. end,
  318. KW_ELEMENT)) {
  319. state->handler = element0;
  320. return XML_ROLE_NONE;
  321. }
  322. if (XmlNameMatchesAscii(enc,
  323. ptr + 2 * MIN_BYTES_PER_CHAR(enc),
  324. end,
  325. KW_NOTATION)) {
  326. state->handler = notation0;
  327. return XML_ROLE_NONE;
  328. }
  329. break;
  330. case XML_TOK_PI:
  331. case XML_TOK_COMMENT:
  332. return XML_ROLE_NONE;
  333. case XML_TOK_PARAM_ENTITY_REF:
  334. return XML_ROLE_PARAM_ENTITY_REF;
  335. case XML_TOK_CLOSE_BRACKET:
  336. state->handler = doctype5;
  337. return XML_ROLE_NONE;
  338. }
  339. return common(state, tok);
  340. }
  341. #ifdef XML_DTD
  342. static
  343. int externalSubset0(PROLOG_STATE *state,
  344. int tok,
  345. const char *ptr,
  346. const char *end,
  347. const ENCODING *enc)
  348. {
  349. state->handler = externalSubset1;
  350. if (tok == XML_TOK_XML_DECL)
  351. return XML_ROLE_TEXT_DECL;
  352. return externalSubset1(state, tok, ptr, end, enc);
  353. }
  354. static
  355. int externalSubset1(PROLOG_STATE *state,
  356. int tok,
  357. const char *ptr,
  358. const char *end,
  359. const ENCODING *enc)
  360. {
  361. switch (tok) {
  362. case XML_TOK_COND_SECT_OPEN:
  363. state->handler = condSect0;
  364. return XML_ROLE_NONE;
  365. case XML_TOK_COND_SECT_CLOSE:
  366. if (state->includeLevel == 0)
  367. break;
  368. state->includeLevel -= 1;
  369. return XML_ROLE_NONE;
  370. case XML_TOK_PROLOG_S:
  371. return XML_ROLE_NONE;
  372. case XML_TOK_CLOSE_BRACKET:
  373. break;
  374. case XML_TOK_NONE:
  375. if (state->includeLevel)
  376. break;
  377. return XML_ROLE_NONE;
  378. default:
  379. return internalSubset(state, tok, ptr, end, enc);
  380. }
  381. return common(state, tok);
  382. }
  383. #endif /* XML_DTD */
  384. static
  385. int entity0(PROLOG_STATE *state,
  386. int tok,
  387. const char *ptr,
  388. const char *end,
  389. const ENCODING *enc)
  390. {
  391. cmExpatUnused(ptr);
  392. cmExpatUnused(end);
  393. cmExpatUnused(enc);
  394. switch (tok) {
  395. case XML_TOK_PROLOG_S:
  396. return XML_ROLE_NONE;
  397. case XML_TOK_PERCENT:
  398. state->handler = entity1;
  399. return XML_ROLE_NONE;
  400. case XML_TOK_NAME:
  401. state->handler = entity2;
  402. return XML_ROLE_GENERAL_ENTITY_NAME;
  403. }
  404. return common(state, tok);
  405. }
  406. static
  407. int entity1(PROLOG_STATE *state,
  408. int tok,
  409. const char *ptr,
  410. const char *end,
  411. const ENCODING *enc)
  412. {
  413. cmExpatUnused(ptr);
  414. cmExpatUnused(end);
  415. cmExpatUnused(enc);
  416. switch (tok) {
  417. case XML_TOK_PROLOG_S:
  418. return XML_ROLE_NONE;
  419. case XML_TOK_NAME:
  420. state->handler = entity7;
  421. return XML_ROLE_PARAM_ENTITY_NAME;
  422. }
  423. return common(state, tok);
  424. }
  425. static
  426. int entity2(PROLOG_STATE *state,
  427. int tok,
  428. const char *ptr,
  429. const char *end,
  430. const ENCODING *enc)
  431. {
  432. switch (tok) {
  433. case XML_TOK_PROLOG_S:
  434. return XML_ROLE_NONE;
  435. case XML_TOK_NAME:
  436. if (XmlNameMatchesAscii(enc, ptr, end, KW_SYSTEM)) {
  437. state->handler = entity4;
  438. return XML_ROLE_NONE;
  439. }
  440. if (XmlNameMatchesAscii(enc, ptr, end, KW_PUBLIC)) {
  441. state->handler = entity3;
  442. return XML_ROLE_NONE;
  443. }
  444. break;
  445. case XML_TOK_LITERAL:
  446. state->handler = declClose;
  447. return XML_ROLE_ENTITY_VALUE;
  448. }
  449. return common(state, tok);
  450. }
  451. static
  452. int entity3(PROLOG_STATE *state,
  453. int tok,
  454. const char *ptr,
  455. const char *end,
  456. const ENCODING *enc)
  457. {
  458. cmExpatUnused(ptr);
  459. cmExpatUnused(end);
  460. cmExpatUnused(enc);
  461. switch (tok) {
  462. case XML_TOK_PROLOG_S:
  463. return XML_ROLE_NONE;
  464. case XML_TOK_LITERAL:
  465. state->handler = entity4;
  466. return XML_ROLE_ENTITY_PUBLIC_ID;
  467. }
  468. return common(state, tok);
  469. }
  470. static
  471. int entity4(PROLOG_STATE *state,
  472. int tok,
  473. const char *ptr,
  474. const char *end,
  475. const ENCODING *enc)
  476. {
  477. cmExpatUnused(ptr);
  478. cmExpatUnused(end);
  479. cmExpatUnused(enc);
  480. switch (tok) {
  481. case XML_TOK_PROLOG_S:
  482. return XML_ROLE_NONE;
  483. case XML_TOK_LITERAL:
  484. state->handler = entity5;
  485. return XML_ROLE_ENTITY_SYSTEM_ID;
  486. }
  487. return common(state, tok);
  488. }
  489. static
  490. int entity5(PROLOG_STATE *state,
  491. int tok,
  492. const char *ptr,
  493. const char *end,
  494. const ENCODING *enc)
  495. {
  496. switch (tok) {
  497. case XML_TOK_PROLOG_S:
  498. return XML_ROLE_NONE;
  499. case XML_TOK_DECL_CLOSE:
  500. setTopLevel(state);
  501. return XML_ROLE_ENTITY_COMPLETE;
  502. case XML_TOK_NAME:
  503. if (XmlNameMatchesAscii(enc, ptr, end, KW_NDATA)) {
  504. state->handler = entity6;
  505. return XML_ROLE_NONE;
  506. }
  507. break;
  508. }
  509. return common(state, tok);
  510. }
  511. static
  512. int entity6(PROLOG_STATE *state,
  513. int tok,
  514. const char *ptr,
  515. const char *end,
  516. const ENCODING *enc)
  517. {
  518. cmExpatUnused(ptr);
  519. cmExpatUnused(end);
  520. cmExpatUnused(enc);
  521. switch (tok) {
  522. case XML_TOK_PROLOG_S:
  523. return XML_ROLE_NONE;
  524. case XML_TOK_NAME:
  525. state->handler = declClose;
  526. return XML_ROLE_ENTITY_NOTATION_NAME;
  527. }
  528. return common(state, tok);
  529. }
  530. static
  531. int entity7(PROLOG_STATE *state,
  532. int tok,
  533. const char *ptr,
  534. const char *end,
  535. const ENCODING *enc)
  536. {
  537. switch (tok) {
  538. case XML_TOK_PROLOG_S:
  539. return XML_ROLE_NONE;
  540. case XML_TOK_NAME:
  541. if (XmlNameMatchesAscii(enc, ptr, end, KW_SYSTEM)) {
  542. state->handler = entity9;
  543. return XML_ROLE_NONE;
  544. }
  545. if (XmlNameMatchesAscii(enc, ptr, end, KW_PUBLIC)) {
  546. state->handler = entity8;
  547. return XML_ROLE_NONE;
  548. }
  549. break;
  550. case XML_TOK_LITERAL:
  551. state->handler = declClose;
  552. return XML_ROLE_ENTITY_VALUE;
  553. }
  554. return common(state, tok);
  555. }
  556. static
  557. int entity8(PROLOG_STATE *state,
  558. int tok,
  559. const char *ptr,
  560. const char *end,
  561. const ENCODING *enc)
  562. {
  563. cmExpatUnused(ptr);
  564. cmExpatUnused(end);
  565. cmExpatUnused(enc);
  566. switch (tok) {
  567. case XML_TOK_PROLOG_S:
  568. return XML_ROLE_NONE;
  569. case XML_TOK_LITERAL:
  570. state->handler = entity9;
  571. return XML_ROLE_ENTITY_PUBLIC_ID;
  572. }
  573. return common(state, tok);
  574. }
  575. static
  576. int entity9(PROLOG_STATE *state,
  577. int tok,
  578. const char *ptr,
  579. const char *end,
  580. const ENCODING *enc)
  581. {
  582. cmExpatUnused(ptr);
  583. cmExpatUnused(end);
  584. cmExpatUnused(enc);
  585. switch (tok) {
  586. case XML_TOK_PROLOG_S:
  587. return XML_ROLE_NONE;
  588. case XML_TOK_LITERAL:
  589. state->handler = declClose;
  590. return XML_ROLE_ENTITY_SYSTEM_ID;
  591. }
  592. return common(state, tok);
  593. }
  594. static
  595. int notation0(PROLOG_STATE *state,
  596. int tok,
  597. const char *ptr,
  598. const char *end,
  599. const ENCODING *enc)
  600. {
  601. cmExpatUnused(ptr);
  602. cmExpatUnused(end);
  603. cmExpatUnused(enc);
  604. switch (tok) {
  605. case XML_TOK_PROLOG_S:
  606. return XML_ROLE_NONE;
  607. case XML_TOK_NAME:
  608. state->handler = notation1;
  609. return XML_ROLE_NOTATION_NAME;
  610. }
  611. return common(state, tok);
  612. }
  613. static
  614. int notation1(PROLOG_STATE *state,
  615. int tok,
  616. const char *ptr,
  617. const char *end,
  618. const ENCODING *enc)
  619. {
  620. switch (tok) {
  621. case XML_TOK_PROLOG_S:
  622. return XML_ROLE_NONE;
  623. case XML_TOK_NAME:
  624. if (XmlNameMatchesAscii(enc, ptr, end, KW_SYSTEM)) {
  625. state->handler = notation3;
  626. return XML_ROLE_NONE;
  627. }
  628. if (XmlNameMatchesAscii(enc, ptr, end, KW_PUBLIC)) {
  629. state->handler = notation2;
  630. return XML_ROLE_NONE;
  631. }
  632. break;
  633. }
  634. return common(state, tok);
  635. }
  636. static
  637. int notation2(PROLOG_STATE *state,
  638. int tok,
  639. const char *ptr,
  640. const char *end,
  641. const ENCODING *enc)
  642. {
  643. cmExpatUnused(ptr);
  644. cmExpatUnused(end);
  645. cmExpatUnused(enc);
  646. switch (tok) {
  647. case XML_TOK_PROLOG_S:
  648. return XML_ROLE_NONE;
  649. case XML_TOK_LITERAL:
  650. state->handler = notation4;
  651. return XML_ROLE_NOTATION_PUBLIC_ID;
  652. }
  653. return common(state, tok);
  654. }
  655. static
  656. int notation3(PROLOG_STATE *state,
  657. int tok,
  658. const char *ptr,
  659. const char *end,
  660. const ENCODING *enc)
  661. {
  662. cmExpatUnused(ptr);
  663. cmExpatUnused(end);
  664. cmExpatUnused(enc);
  665. switch (tok) {
  666. case XML_TOK_PROLOG_S:
  667. return XML_ROLE_NONE;
  668. case XML_TOK_LITERAL:
  669. state->handler = declClose;
  670. return XML_ROLE_NOTATION_SYSTEM_ID;
  671. }
  672. return common(state, tok);
  673. }
  674. static
  675. int notation4(PROLOG_STATE *state,
  676. int tok,
  677. const char *ptr,
  678. const char *end,
  679. const ENCODING *enc)
  680. {
  681. cmExpatUnused(ptr);
  682. cmExpatUnused(end);
  683. cmExpatUnused(enc);
  684. switch (tok) {
  685. case XML_TOK_PROLOG_S:
  686. return XML_ROLE_NONE;
  687. case XML_TOK_LITERAL:
  688. state->handler = declClose;
  689. return XML_ROLE_NOTATION_SYSTEM_ID;
  690. case XML_TOK_DECL_CLOSE:
  691. setTopLevel(state);
  692. return XML_ROLE_NOTATION_NO_SYSTEM_ID;
  693. }
  694. return common(state, tok);
  695. }
  696. static
  697. int attlist0(PROLOG_STATE *state,
  698. int tok,
  699. const char *ptr,
  700. const char *end,
  701. const ENCODING *enc)
  702. {
  703. cmExpatUnused(ptr);
  704. cmExpatUnused(end);
  705. cmExpatUnused(enc);
  706. switch (tok) {
  707. case XML_TOK_PROLOG_S:
  708. return XML_ROLE_NONE;
  709. case XML_TOK_NAME:
  710. case XML_TOK_PREFIXED_NAME:
  711. state->handler = attlist1;
  712. return XML_ROLE_ATTLIST_ELEMENT_NAME;
  713. }
  714. return common(state, tok);
  715. }
  716. static
  717. int attlist1(PROLOG_STATE *state,
  718. int tok,
  719. const char *ptr,
  720. const char *end,
  721. const ENCODING *enc)
  722. {
  723. cmExpatUnused(ptr);
  724. cmExpatUnused(end);
  725. cmExpatUnused(enc);
  726. switch (tok) {
  727. case XML_TOK_PROLOG_S:
  728. return XML_ROLE_NONE;
  729. case XML_TOK_DECL_CLOSE:
  730. setTopLevel(state);
  731. return XML_ROLE_NONE;
  732. case XML_TOK_NAME:
  733. case XML_TOK_PREFIXED_NAME:
  734. state->handler = attlist2;
  735. return XML_ROLE_ATTRIBUTE_NAME;
  736. }
  737. return common(state, tok);
  738. }
  739. static
  740. int attlist2(PROLOG_STATE *state,
  741. int tok,
  742. const char *ptr,
  743. const char *end,
  744. const ENCODING *enc)
  745. {
  746. cmExpatUnused(ptr);
  747. cmExpatUnused(end);
  748. cmExpatUnused(enc);
  749. switch (tok) {
  750. case XML_TOK_PROLOG_S:
  751. return XML_ROLE_NONE;
  752. case XML_TOK_NAME:
  753. {
  754. static const char *types[] = {
  755. KW_CDATA,
  756. KW_ID,
  757. KW_IDREF,
  758. KW_IDREFS,
  759. KW_ENTITY,
  760. KW_ENTITIES,
  761. KW_NMTOKEN,
  762. KW_NMTOKENS,
  763. };
  764. int i;
  765. for (i = 0; i < (int)(sizeof(types)/sizeof(types[0])); i++)
  766. if (XmlNameMatchesAscii(enc, ptr, end, types[i])) {
  767. state->handler = attlist8;
  768. return XML_ROLE_ATTRIBUTE_TYPE_CDATA + i;
  769. }
  770. }
  771. if (XmlNameMatchesAscii(enc, ptr, end, KW_NOTATION)) {
  772. state->handler = attlist5;
  773. return XML_ROLE_NONE;
  774. }
  775. break;
  776. case XML_TOK_OPEN_PAREN:
  777. state->handler = attlist3;
  778. return XML_ROLE_NONE;
  779. }
  780. return common(state, tok);
  781. }
  782. static
  783. int attlist3(PROLOG_STATE *state,
  784. int tok,
  785. const char *ptr,
  786. const char *end,
  787. const ENCODING *enc)
  788. {
  789. cmExpatUnused(ptr);
  790. cmExpatUnused(end);
  791. cmExpatUnused(enc);
  792. switch (tok) {
  793. case XML_TOK_PROLOG_S:
  794. return XML_ROLE_NONE;
  795. case XML_TOK_NMTOKEN:
  796. case XML_TOK_NAME:
  797. case XML_TOK_PREFIXED_NAME:
  798. state->handler = attlist4;
  799. return XML_ROLE_ATTRIBUTE_ENUM_VALUE;
  800. }
  801. return common(state, tok);
  802. }
  803. static
  804. int attlist4(PROLOG_STATE *state,
  805. int tok,
  806. const char *ptr,
  807. const char *end,
  808. const ENCODING *enc)
  809. {
  810. cmExpatUnused(ptr);
  811. cmExpatUnused(end);
  812. cmExpatUnused(enc);
  813. switch (tok) {
  814. case XML_TOK_PROLOG_S:
  815. return XML_ROLE_NONE;
  816. case XML_TOK_CLOSE_PAREN:
  817. state->handler = attlist8;
  818. return XML_ROLE_NONE;
  819. case XML_TOK_OR:
  820. state->handler = attlist3;
  821. return XML_ROLE_NONE;
  822. }
  823. return common(state, tok);
  824. }
  825. static
  826. int attlist5(PROLOG_STATE *state,
  827. int tok,
  828. const char *ptr,
  829. const char *end,
  830. const ENCODING *enc)
  831. {
  832. cmExpatUnused(ptr);
  833. cmExpatUnused(end);
  834. cmExpatUnused(enc);
  835. switch (tok) {
  836. case XML_TOK_PROLOG_S:
  837. return XML_ROLE_NONE;
  838. case XML_TOK_OPEN_PAREN:
  839. state->handler = attlist6;
  840. return XML_ROLE_NONE;
  841. }
  842. return common(state, tok);
  843. }
  844. static
  845. int attlist6(PROLOG_STATE *state,
  846. int tok,
  847. const char *ptr,
  848. const char *end,
  849. const ENCODING *enc)
  850. {
  851. cmExpatUnused(ptr);
  852. cmExpatUnused(end);
  853. cmExpatUnused(enc);
  854. switch (tok) {
  855. case XML_TOK_PROLOG_S:
  856. return XML_ROLE_NONE;
  857. case XML_TOK_NAME:
  858. state->handler = attlist7;
  859. return XML_ROLE_ATTRIBUTE_NOTATION_VALUE;
  860. }
  861. return common(state, tok);
  862. }
  863. static
  864. int attlist7(PROLOG_STATE *state,
  865. int tok,
  866. const char *ptr,
  867. const char *end,
  868. const ENCODING *enc)
  869. {
  870. cmExpatUnused(ptr);
  871. cmExpatUnused(end);
  872. cmExpatUnused(enc);
  873. switch (tok) {
  874. case XML_TOK_PROLOG_S:
  875. return XML_ROLE_NONE;
  876. case XML_TOK_CLOSE_PAREN:
  877. state->handler = attlist8;
  878. return XML_ROLE_NONE;
  879. case XML_TOK_OR:
  880. state->handler = attlist6;
  881. return XML_ROLE_NONE;
  882. }
  883. return common(state, tok);
  884. }
  885. /* default value */
  886. static
  887. int attlist8(PROLOG_STATE *state,
  888. int tok,
  889. const char *ptr,
  890. const char *end,
  891. const ENCODING *enc)
  892. {
  893. cmExpatUnused(ptr);
  894. cmExpatUnused(end);
  895. cmExpatUnused(enc);
  896. switch (tok) {
  897. case XML_TOK_PROLOG_S:
  898. return XML_ROLE_NONE;
  899. case XML_TOK_POUND_NAME:
  900. if (XmlNameMatchesAscii(enc,
  901. ptr + MIN_BYTES_PER_CHAR(enc),
  902. end,
  903. KW_IMPLIED)) {
  904. state->handler = attlist1;
  905. return XML_ROLE_IMPLIED_ATTRIBUTE_VALUE;
  906. }
  907. if (XmlNameMatchesAscii(enc,
  908. ptr + MIN_BYTES_PER_CHAR(enc),
  909. end,
  910. KW_REQUIRED)) {
  911. state->handler = attlist1;
  912. return XML_ROLE_REQUIRED_ATTRIBUTE_VALUE;
  913. }
  914. if (XmlNameMatchesAscii(enc,
  915. ptr + MIN_BYTES_PER_CHAR(enc),
  916. end,
  917. KW_FIXED)) {
  918. state->handler = attlist9;
  919. return XML_ROLE_NONE;
  920. }
  921. break;
  922. case XML_TOK_LITERAL:
  923. state->handler = attlist1;
  924. return XML_ROLE_DEFAULT_ATTRIBUTE_VALUE;
  925. }
  926. return common(state, tok);
  927. }
  928. static
  929. int attlist9(PROLOG_STATE *state,
  930. int tok,
  931. const char *ptr,
  932. const char *end,
  933. const ENCODING *enc)
  934. {
  935. cmExpatUnused(ptr);
  936. cmExpatUnused(end);
  937. cmExpatUnused(enc);
  938. switch (tok) {
  939. case XML_TOK_PROLOG_S:
  940. return XML_ROLE_NONE;
  941. case XML_TOK_LITERAL:
  942. state->handler = attlist1;
  943. return XML_ROLE_FIXED_ATTRIBUTE_VALUE;
  944. }
  945. return common(state, tok);
  946. }
  947. static
  948. int element0(PROLOG_STATE *state,
  949. int tok,
  950. const char *ptr,
  951. const char *end,
  952. const ENCODING *enc)
  953. {
  954. cmExpatUnused(ptr);
  955. cmExpatUnused(end);
  956. cmExpatUnused(enc);
  957. switch (tok) {
  958. case XML_TOK_PROLOG_S:
  959. return XML_ROLE_NONE;
  960. case XML_TOK_NAME:
  961. case XML_TOK_PREFIXED_NAME:
  962. state->handler = element1;
  963. return XML_ROLE_ELEMENT_NAME;
  964. }
  965. return common(state, tok);
  966. }
  967. static
  968. int element1(PROLOG_STATE *state,
  969. int tok,
  970. const char *ptr,
  971. const char *end,
  972. const ENCODING *enc)
  973. {
  974. cmExpatUnused(ptr);
  975. cmExpatUnused(end);
  976. cmExpatUnused(enc);
  977. switch (tok) {
  978. case XML_TOK_PROLOG_S:
  979. return XML_ROLE_NONE;
  980. case XML_TOK_NAME:
  981. if (XmlNameMatchesAscii(enc, ptr, end, KW_EMPTY)) {
  982. state->handler = declClose;
  983. return XML_ROLE_CONTENT_EMPTY;
  984. }
  985. if (XmlNameMatchesAscii(enc, ptr, end, KW_ANY)) {
  986. state->handler = declClose;
  987. return XML_ROLE_CONTENT_ANY;
  988. }
  989. break;
  990. case XML_TOK_OPEN_PAREN:
  991. state->handler = element2;
  992. state->level = 1;
  993. return XML_ROLE_GROUP_OPEN;
  994. }
  995. return common(state, tok);
  996. }
  997. static
  998. int element2(PROLOG_STATE *state,
  999. int tok,
  1000. const char *ptr,
  1001. const char *end,
  1002. const ENCODING *enc)
  1003. {
  1004. cmExpatUnused(ptr);
  1005. cmExpatUnused(end);
  1006. cmExpatUnused(enc);
  1007. switch (tok) {
  1008. case XML_TOK_PROLOG_S:
  1009. return XML_ROLE_NONE;
  1010. case XML_TOK_POUND_NAME:
  1011. if (XmlNameMatchesAscii(enc,
  1012. ptr + MIN_BYTES_PER_CHAR(enc),
  1013. end,
  1014. KW_PCDATA)) {
  1015. state->handler = element3;
  1016. return XML_ROLE_CONTENT_PCDATA;
  1017. }
  1018. break;
  1019. case XML_TOK_OPEN_PAREN:
  1020. state->level = 2;
  1021. state->handler = element6;
  1022. return XML_ROLE_GROUP_OPEN;
  1023. case XML_TOK_NAME:
  1024. case XML_TOK_PREFIXED_NAME:
  1025. state->handler = element7;
  1026. return XML_ROLE_CONTENT_ELEMENT;
  1027. case XML_TOK_NAME_QUESTION:
  1028. state->handler = element7;
  1029. return XML_ROLE_CONTENT_ELEMENT_OPT;
  1030. case XML_TOK_NAME_ASTERISK:
  1031. state->handler = element7;
  1032. return XML_ROLE_CONTENT_ELEMENT_REP;
  1033. case XML_TOK_NAME_PLUS:
  1034. state->handler = element7;
  1035. return XML_ROLE_CONTENT_ELEMENT_PLUS;
  1036. }
  1037. return common(state, tok);
  1038. }
  1039. static
  1040. int element3(PROLOG_STATE *state,
  1041. int tok,
  1042. const char *ptr,
  1043. const char *end,
  1044. const ENCODING *enc)
  1045. {
  1046. cmExpatUnused(ptr);
  1047. cmExpatUnused(end);
  1048. cmExpatUnused(enc);
  1049. switch (tok) {
  1050. case XML_TOK_PROLOG_S:
  1051. return XML_ROLE_NONE;
  1052. case XML_TOK_CLOSE_PAREN:
  1053. state->handler = declClose;
  1054. return XML_ROLE_GROUP_CLOSE;
  1055. case XML_TOK_CLOSE_PAREN_ASTERISK:
  1056. state->handler = declClose;
  1057. return XML_ROLE_GROUP_CLOSE_REP;
  1058. case XML_TOK_OR:
  1059. state->handler = element4;
  1060. return XML_ROLE_NONE;
  1061. }
  1062. return common(state, tok);
  1063. }
  1064. static
  1065. int element4(PROLOG_STATE *state,
  1066. int tok,
  1067. const char *ptr,
  1068. const char *end,
  1069. const ENCODING *enc)
  1070. {
  1071. cmExpatUnused(ptr);
  1072. cmExpatUnused(end);
  1073. cmExpatUnused(enc);
  1074. switch (tok) {
  1075. case XML_TOK_PROLOG_S:
  1076. return XML_ROLE_NONE;
  1077. case XML_TOK_NAME:
  1078. case XML_TOK_PREFIXED_NAME:
  1079. state->handler = element5;
  1080. return XML_ROLE_CONTENT_ELEMENT;
  1081. }
  1082. return common(state, tok);
  1083. }
  1084. static
  1085. int element5(PROLOG_STATE *state,
  1086. int tok,
  1087. const char *ptr,
  1088. const char *end,
  1089. const ENCODING *enc)
  1090. {
  1091. cmExpatUnused(ptr);
  1092. cmExpatUnused(end);
  1093. cmExpatUnused(enc);
  1094. switch (tok) {
  1095. case XML_TOK_PROLOG_S:
  1096. return XML_ROLE_NONE;
  1097. case XML_TOK_CLOSE_PAREN_ASTERISK:
  1098. state->handler = declClose;
  1099. return XML_ROLE_GROUP_CLOSE_REP;
  1100. case XML_TOK_OR:
  1101. state->handler = element4;
  1102. return XML_ROLE_NONE;
  1103. }
  1104. return common(state, tok);
  1105. }
  1106. static
  1107. int element6(PROLOG_STATE *state,
  1108. int tok,
  1109. const char *ptr,
  1110. const char *end,
  1111. const ENCODING *enc)
  1112. {
  1113. cmExpatUnused(ptr);
  1114. cmExpatUnused(end);
  1115. cmExpatUnused(enc);
  1116. switch (tok) {
  1117. case XML_TOK_PROLOG_S:
  1118. return XML_ROLE_NONE;
  1119. case XML_TOK_OPEN_PAREN:
  1120. state->level += 1;
  1121. return XML_ROLE_GROUP_OPEN;
  1122. case XML_TOK_NAME:
  1123. case XML_TOK_PREFIXED_NAME:
  1124. state->handler = element7;
  1125. return XML_ROLE_CONTENT_ELEMENT;
  1126. case XML_TOK_NAME_QUESTION:
  1127. state->handler = element7;
  1128. return XML_ROLE_CONTENT_ELEMENT_OPT;
  1129. case XML_TOK_NAME_ASTERISK:
  1130. state->handler = element7;
  1131. return XML_ROLE_CONTENT_ELEMENT_REP;
  1132. case XML_TOK_NAME_PLUS:
  1133. state->handler = element7;
  1134. return XML_ROLE_CONTENT_ELEMENT_PLUS;
  1135. }
  1136. return common(state, tok);
  1137. }
  1138. static
  1139. int element7(PROLOG_STATE *state,
  1140. int tok,
  1141. const char *ptr,
  1142. const char *end,
  1143. const ENCODING *enc)
  1144. {
  1145. cmExpatUnused(ptr);
  1146. cmExpatUnused(end);
  1147. cmExpatUnused(enc);
  1148. switch (tok) {
  1149. case XML_TOK_PROLOG_S:
  1150. return XML_ROLE_NONE;
  1151. case XML_TOK_CLOSE_PAREN:
  1152. state->level -= 1;
  1153. if (state->level == 0)
  1154. state->handler = declClose;
  1155. return XML_ROLE_GROUP_CLOSE;
  1156. case XML_TOK_CLOSE_PAREN_ASTERISK:
  1157. state->level -= 1;
  1158. if (state->level == 0)
  1159. state->handler = declClose;
  1160. return XML_ROLE_GROUP_CLOSE_REP;
  1161. case XML_TOK_CLOSE_PAREN_QUESTION:
  1162. state->level -= 1;
  1163. if (state->level == 0)
  1164. state->handler = declClose;
  1165. return XML_ROLE_GROUP_CLOSE_OPT;
  1166. case XML_TOK_CLOSE_PAREN_PLUS:
  1167. state->level -= 1;
  1168. if (state->level == 0)
  1169. state->handler = declClose;
  1170. return XML_ROLE_GROUP_CLOSE_PLUS;
  1171. case XML_TOK_COMMA:
  1172. state->handler = element6;
  1173. return XML_ROLE_GROUP_SEQUENCE;
  1174. case XML_TOK_OR:
  1175. state->handler = element6;
  1176. return XML_ROLE_GROUP_CHOICE;
  1177. }
  1178. return common(state, tok);
  1179. }
  1180. #ifdef XML_DTD
  1181. static
  1182. int condSect0(PROLOG_STATE *state,
  1183. int tok,
  1184. const char *ptr,
  1185. const char *end,
  1186. const ENCODING *enc)
  1187. {
  1188. cmExpatUnused(ptr);
  1189. cmExpatUnused(end);
  1190. cmExpatUnused(enc);
  1191. switch (tok) {
  1192. case XML_TOK_PROLOG_S:
  1193. return XML_ROLE_NONE;
  1194. case XML_TOK_NAME:
  1195. if (XmlNameMatchesAscii(enc, ptr, end, KW_INCLUDE)) {
  1196. state->handler = condSect1;
  1197. return XML_ROLE_NONE;
  1198. }
  1199. if (XmlNameMatchesAscii(enc, ptr, end, KW_IGNORE)) {
  1200. state->handler = condSect2;
  1201. return XML_ROLE_NONE;
  1202. }
  1203. break;
  1204. }
  1205. return common(state, tok);
  1206. }
  1207. static
  1208. int condSect1(PROLOG_STATE *state,
  1209. int tok,
  1210. const char *ptr,
  1211. const char *end,
  1212. const ENCODING *enc)
  1213. {
  1214. cmExpatUnused(ptr);
  1215. cmExpatUnused(end);
  1216. cmExpatUnused(enc);
  1217. switch (tok) {
  1218. case XML_TOK_PROLOG_S:
  1219. return XML_ROLE_NONE;
  1220. case XML_TOK_OPEN_BRACKET:
  1221. state->handler = externalSubset1;
  1222. state->includeLevel += 1;
  1223. return XML_ROLE_NONE;
  1224. }
  1225. return common(state, tok);
  1226. }
  1227. static
  1228. int condSect2(PROLOG_STATE *state,
  1229. int tok,
  1230. const char *ptr,
  1231. const char *end,
  1232. const ENCODING *enc)
  1233. {
  1234. cmExpatUnused(ptr);
  1235. cmExpatUnused(end);
  1236. cmExpatUnused(enc);
  1237. switch (tok) {
  1238. case XML_TOK_PROLOG_S:
  1239. return XML_ROLE_NONE;
  1240. case XML_TOK_OPEN_BRACKET:
  1241. state->handler = externalSubset1;
  1242. return XML_ROLE_IGNORE_SECT;
  1243. }
  1244. return common(state, tok);
  1245. }
  1246. #endif /* XML_DTD */
  1247. static
  1248. int declClose(PROLOG_STATE *state,
  1249. int tok,
  1250. const char *ptr,
  1251. const char *end,
  1252. const ENCODING *enc)
  1253. {
  1254. cmExpatUnused(ptr);
  1255. cmExpatUnused(end);
  1256. cmExpatUnused(enc);
  1257. switch (tok) {
  1258. case XML_TOK_PROLOG_S:
  1259. return XML_ROLE_NONE;
  1260. case XML_TOK_DECL_CLOSE:
  1261. setTopLevel(state);
  1262. return XML_ROLE_NONE;
  1263. }
  1264. return common(state, tok);
  1265. }
  1266. #if 0
  1267. static
  1268. int ignore(PROLOG_STATE *state,
  1269. int tok,
  1270. const char *ptr,
  1271. const char *end,
  1272. const ENCODING *enc)
  1273. {
  1274. cmExpatUnused(ptr);
  1275. cmExpatUnused(end);
  1276. cmExpatUnused(enc);
  1277. switch (tok) {
  1278. case XML_TOK_DECL_CLOSE:
  1279. state->handler = internalSubset;
  1280. return 0;
  1281. default:
  1282. return XML_ROLE_NONE;
  1283. }
  1284. return common(state, tok);
  1285. }
  1286. #endif
  1287. static
  1288. int error(PROLOG_STATE *state,
  1289. int tok,
  1290. const char *ptr,
  1291. const char *end,
  1292. const ENCODING *enc)
  1293. {
  1294. cmExpatUnused(state);
  1295. cmExpatUnused(tok);
  1296. cmExpatUnused(ptr);
  1297. cmExpatUnused(end);
  1298. cmExpatUnused(enc);
  1299. return XML_ROLE_NONE;
  1300. }
  1301. static
  1302. int common(PROLOG_STATE *state, int tok)
  1303. {
  1304. #ifdef XML_DTD
  1305. if (!state->documentEntity && tok == XML_TOK_PARAM_ENTITY_REF)
  1306. return XML_ROLE_INNER_PARAM_ENTITY_REF;
  1307. #endif
  1308. state->handler = error;
  1309. return XML_ROLE_ERROR;
  1310. }
  1311. void XmlPrologStateInit(PROLOG_STATE *state)
  1312. {
  1313. state->handler = prolog0;
  1314. #ifdef XML_DTD
  1315. state->documentEntity = 1;
  1316. state->includeLevel = 0;
  1317. #endif /* XML_DTD */
  1318. }
  1319. #ifdef XML_DTD
  1320. void XmlPrologStateInitExternalEntity(PROLOG_STATE *state)
  1321. {
  1322. state->handler = externalSubset0;
  1323. state->documentEntity = 0;
  1324. state->includeLevel = 0;
  1325. }
  1326. #endif /* XML_DTD */