token.c 6.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241
  1. #include "__token.h"
  2. Token *makeToken(){
  3. Token *tmp = memCalloc(1, sizeof(Token));
  4. tmp->token_type = 0;
  5. tmp->data.str = NULL;
  6. tmp->data.st = NULL;
  7. tmp->data.second_str = NULL;
  8. return tmp;
  9. }
  10. Token *makeLexToken(int type, char *str, char *second_str) {
  11. struct Token *tmp = makeToken();
  12. tmp->token_type = type;
  13. tmp->data.str = memStrcpy(str, 0, false, false);
  14. tmp->data.second_str = memStrcpy(second_str, 0, false, false);
  15. return tmp;
  16. }
  17. Token *makeStatementToken(int type, struct Statement *st){
  18. struct Token *tmp = makeToken();
  19. tmp->token_type = type;
  20. tmp->data.st = st;
  21. return tmp;
  22. }
  23. void freeToken(Token *tk, bool self, bool error) {
  24. memFree(tk->data.str);
  25. memFree(tk->data.second_str);
  26. if (error){
  27. freeStatement(tk->data.st);
  28. }
  29. if (self){
  30. memFree(tk);
  31. }
  32. }
  33. TokenStream *makeTokenStream(){
  34. TokenStream *tmp = memCalloc(1, sizeof(TokenStream));
  35. tmp->size = 0;
  36. tmp->ahead = 0;
  37. tmp->token_list = NULL;
  38. tmp->token_ahead = NULL;
  39. return tmp;
  40. }
  41. void freeToekStream(TokenStream *ts, bool self) {
  42. for (int i=0; i < ts->size; i++){
  43. freeToken(ts->token_list[i], true, false);
  44. }
  45. for (int i=0; i < ts->ahead; i++){
  46. freeToken(ts->token_ahead[i], true, false);
  47. }
  48. memFree(ts->token_list);
  49. memFree(ts->token_ahead);
  50. if (self){
  51. memFree(ts);
  52. }
  53. }
  54. TokenMessage *makeTokenMessage(char *file_dir, char *debug) {
  55. TokenMessage *tm = memCalloc(1, sizeof(TokenMessage));
  56. tm->file = makeLexFile(file_dir);
  57. tm->mathers = makeMathers(MATHER_MAX);
  58. tm->ts = makeTokenStream();
  59. #if OUT_LOG
  60. if (debug != NULL){
  61. char *debug_dir = memStrcat(debug, LEXICAL_LOG);
  62. tm->debug = fopen(debug_dir, "w");
  63. memFree(debug_dir);
  64. }
  65. else{
  66. tm->debug = NULL;
  67. }
  68. #else
  69. tm->debug = NULL;
  70. #endif
  71. return tm;
  72. }
  73. void freeTokenMessage(TokenMessage *tm, bool self) {
  74. freeLexFile(tm->file, true);
  75. freeToekStream(tm->ts, true);
  76. freeMathers(tm->mathers, true);
  77. #if OUT_LOG
  78. if (tm->debug != NULL)
  79. fclose(tm->debug);
  80. #endif
  81. if (self){
  82. free(tm);
  83. }
  84. }
  85. /**
  86. * 添加一个token到token_list,token_ahend保持
  87. * @param ts
  88. * @param new_tk
  89. */
  90. void addToken(TokenStream *ts, Token *new_tk, FILE *debug) {
  91. printTokenEnter(new_tk, debug, DEBUG, "add Token: ");
  92. Token **new_list = memCalloc(ts->size + 1, sizeof(Token *));
  93. for (int i=0; i < ts->size; i++){
  94. new_list[i] = ts->token_list[i];
  95. }
  96. new_list[ts->size] = new_tk;
  97. ts->size ++;
  98. memFree(ts->token_list);
  99. ts->token_list = new_list;
  100. MACRO_printTokenStream(ts, debug, DEEP_DEBUG);
  101. }
  102. /**
  103. * 从token_list弹出一个token,保持token_ahend
  104. * @param ts
  105. * @return
  106. */
  107. Token *popToken(TokenStream *ts, FILE *debug) {
  108. Token **new_list = memCalloc(ts->size - 1, sizeof(Token *));
  109. for (int i=0; i < ts->size - 1; i++){
  110. new_list[i] = ts->token_list[i];
  111. }
  112. Token *tmp = ts->token_list[ts->size - 1];
  113. memFree(ts->token_list);
  114. ts->token_list = new_list;
  115. ts->size --;
  116. printTokenEnter(tmp, debug, DEBUG, "pop Token: ");
  117. MACRO_printTokenStream(ts, debug, DEEP_DEBUG);
  118. return tmp;
  119. }
  120. /**
  121. * 把token_list的一个token退回到token_ahend
  122. * @param ts
  123. * @return
  124. */
  125. Token *backToken(TokenStream *ts, FILE *debug) {
  126. Token **new_list = memCalloc(ts->size - 1, sizeof(Token *));
  127. Token **new_ahead = memCalloc(ts->ahead + 1, sizeof(Token *));
  128. for (int i=0; i < ts->size - 1; i++){
  129. new_list[i] = ts->token_list[i];
  130. }
  131. for (int i=0; i < ts->ahead; i++){
  132. new_ahead[i] = ts->token_ahead[i];
  133. }
  134. new_ahead[ts->ahead] = ts->token_list[ts->size - 1];
  135. memFree(ts->token_list);
  136. memFree(ts->token_ahead);
  137. ts->token_ahead = new_ahead;
  138. ts->token_list = new_list;
  139. ts->size --;
  140. ts->ahead ++;
  141. printTokenEnter(new_ahead[ts->ahead - 1], debug, DEBUG, "back Token: ");
  142. MACRO_printTokenStream(ts, debug, DEEP_DEBUG);
  143. return new_ahead[ts->ahead - 1];
  144. }
  145. /**
  146. * backToken的逆向操作
  147. * @param ts
  148. * @return
  149. */
  150. Token *forwardToken(TokenStream *ts, FILE *debug) {
  151. Token **new_list = memCalloc(ts->size + 1, sizeof(Token *));
  152. Token **new_ahead = memCalloc(ts->ahead - 1, sizeof(Token *));
  153. for (int i=0; i < ts->size; i++){
  154. new_list[i] = ts->token_list[i];
  155. }
  156. for (int i=0; i < ts->ahead - 1; i++){
  157. new_ahead[i] = ts->token_ahead[i];
  158. }
  159. new_list[ts->size] = ts->token_ahead[ts->ahead - 1];
  160. memFree(ts->token_list);
  161. memFree(ts->token_ahead);
  162. ts->token_ahead = new_ahead;
  163. ts->token_list = new_list;
  164. ts->size ++;
  165. ts->ahead --;
  166. printTokenEnter(new_list[ts->size - 1], debug, DEBUG, "forward Token: ");
  167. MACRO_printTokenStream(ts, debug, DEEP_DEBUG);
  168. return new_list[ts->size - 1];
  169. }
  170. /**
  171. * 获取token, 并且放入token_list中
  172. * 自动处理backToken
  173. * @param tm
  174. * @return 返回获取token的token_type
  175. */
  176. int safeGetToken(TokenMessage *tm, FILE *debug) {
  177. writeLog_(debug, DEBUG, "safe get token : ", NULL);
  178. Token *tmp;
  179. if (tm->ts->ahead == 0){
  180. writeLog_(debug, DEBUG, "get token: %d\n", tm->file->count);
  181. tmp = getToken(tm->file, tm->mathers, tm->debug);
  182. addToken(tm->ts, tmp, debug);
  183. MACRO_printTokenStream(tm->ts, debug, DEBUG);
  184. }
  185. else{
  186. // forwardToken 会有详细的日志输出
  187. tmp = forwardToken(tm->ts, debug);
  188. }
  189. return tmp->token_type;
  190. }
  191. void printToken(Token *tk, FILE *debug, int type) {
  192. if (tk->token_type >= 0) {
  193. char *tmp = tk->data.str, *second_tmp = tk->data.second_str;
  194. if (!strcmp(tmp, "\n")) {
  195. tmp = "\\n";
  196. }
  197. if (!strcmp(second_tmp, "\n")) {
  198. second_tmp = "\\n";
  199. }
  200. if (tmp[0] == EOF) {
  201. tmp = "(EOF)";
  202. }
  203. writeLog_(debug, type, "<token str = ('%s','%s'), type = %d>", tmp, second_tmp, tk->token_type);
  204. }
  205. else{
  206. writeLog_(debug, type, "<token statement, type = %d>", tk->token_type);
  207. }
  208. }
  209. void printTokenStream(TokenStream *ts, FILE *debug, int type) {
  210. writeLog_(debug, type, "token_list: ", NULL);
  211. for (int i=0; i < ts->size; i ++){
  212. if (i > 0)
  213. writeLog_(debug, type, "-", NULL);
  214. printToken(ts->token_list[i], debug, type);
  215. }
  216. writeLog_(debug, type, "\n", NULL);
  217. writeLog_(debug, type, "token_ahead: ", NULL);
  218. for (int i=0; i < ts->ahead; i ++){
  219. if (i > 0)
  220. writeLog_(debug, type, "-", NULL);
  221. printToken(ts->token_ahead[i], debug, type);
  222. }
  223. writeLog_(debug, type, "\n", NULL);
  224. }