00001
00002
00003
00004
00005
00006
00007
00008
00009
00010
00011
00012
00013
00014
00015
00016
00017
00018
00019
00020
00021
00022
00023
00024
00025
00026
00027
00028
00029
00030
00031
00032
00033
00034 #include <lestes/common.hh>
00035 #include <lestes/lang/cplus/lex/trigraphs.hh>
00036 #include <lestes/lang/cplus/lex/ucn_filter.hh>
00037 #include <lestes/lang/cplus/lex/lex_loggers.hh>
00038 #include <lestes/msg/logger.hh>
00039 #include <lestes/msg/logger_util.hh>
00040
00041
00042 package(lestes);
00043 package(lang);
00044 package(cplus);
00045 package(lex);
00046
00047 using namespace ::std;
00048
00049
00050
00051
00052
00053 trigraphs::trigraphs(void):
00054 ucn_filter(),
00055 state(START)
00056 {
00057 }
00058
00059
00060
00061
00062
00063 ptr<ucn_token> trigraphs::read(void)
00064 {
00065 trigraphs_logger << "trigraphs::read()\n" << msg::eolog;
00066 trigraphs_logger << "state == " << state["sqQ12"] << '\n' << msg::eolog;
00067
00068 ptr<ucn_token> t;
00069
00070 switch (state) {
00071 case ONE:
00072
00073 t = first;
00074
00075 first = NULL;
00076 state = START;
00077 trigraphs_logger << "return only saved\ntrigraphs::read() end\n" << msg::eolog;
00078 return t;
00079 case TWO:
00080
00081 t = first;
00082 first = second;
00083
00084 second = NULL;
00085 state = ONE;
00086 trigraphs_logger << "return first saved\ntrigraphs::read() end\n" << msg::eolog;
00087 return t;
00088 default:
00089 break;
00090 }
00091
00092 while (true) {
00093 t = input_read();
00094 ucn_token_type utt = t->type_get();
00095
00096
00097
00098
00099 switch (state) {
00100 case START:
00101 if (utt == ucn_token::TOK_BASIC && t->value_get() == character::ascii_qmark) {
00102
00103 state = QUE;
00104 first = t;
00105 } else {
00106 trigraphs_logger << "trigraphs::read() end\n" << msg::eolog;
00107 return t;
00108 }
00109 break;
00110 case QUE:
00111 if (utt == ucn_token::TOK_BASIC && t->value_get() == character::ascii_qmark) {
00112
00113 state = QUEQUE;
00114 second = t;
00115 } else {
00116 ptr<ucn_token> tmp;
00117
00118 tmp = first;
00119
00120 first = t;
00121 state = ONE;
00122 trigraphs_logger << "trigraphs::read() end\n" << msg::eolog;
00123 return tmp;
00124 }
00125 break;
00126 case QUEQUE:
00127
00128 if (utt == ucn_token::TOK_BASIC) {
00129 ucn u = t->value_get();
00130 ucn v = translation_map[character::extract_value(u)];
00131 if (v != 0) {
00132 t = first;
00133
00134 first = NULL;
00135 t = t->clone_value(v);
00136 state = START;
00137 trigraphs_logger << "trigraphs::read() end\n" << msg::eolog;
00138 return t;
00139 }
00140
00141
00142 state = u == character::ascii_qmark ? QUEQUE : TWO;
00143 } else {
00144
00145 state = TWO;
00146 }
00147
00148
00149 {
00150
00151 ptr<ucn_token> tmp = first;
00152 first = second;
00153 second = t;
00154 trigraphs_logger << "trigraphs::read() end\n" << msg::eolog;
00155 return tmp;
00156 }
00157 default:
00158 lassert2(false,"You should never get here");
00159 }
00160 trigraphs_logger << "state == " << state["sqQ12"] << '\n' << msg::eolog;
00161 }
00162 }
00163
00164
00165
00166
00167 void trigraphs::gc_mark(void)
00168 {
00169 first.gc_mark();
00170 second.gc_mark();
00171 ucn_filter::gc_mark();
00172 }
00173
00174
00175
00176
00177
00178 ptr<trigraphs> trigraphs::create(void)
00179 {
00180 return new trigraphs();
00181 }
00182
00183
00184
00185
00186
00187 const ucn trigraphs::translation_map[trigraphs::translation_length] = {
00188 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
00189 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
00190 character::ascii_vbar,
00191 0, 0, 0, 0, 0,
00192 character::ascii_hat,
00193 character::ascii_left_bracket,
00194 character::ascii_right_bracket,
00195 0, 0, 0,
00196 character::ascii_tilde,
00197 0,
00198 character::ascii_backslash,
00199 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
00200 character::ascii_left_brace,
00201 character::ascii_hash,
00202 character::ascii_right_brace,
00203 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
00204 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
00205 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
00206 0, 0, 0, 0, 0
00207 };
00208
00209 end_package(lex);
00210 end_package(cplus);
00211 end_package(lang);
00212 end_package(lestes);
00213
00214
00215