All files / src/abap/1_lexer lexer.ts

96.83% Statements 306/316
94.89% Branches 186/196
100% Functions 3/3
96.83% Lines 306/316

Press n or j to go to the next uncovered block, b, p or k for the previous block.

1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 3161x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 1x 1x 285623x 285623x 183272x 183272x 183272x 183272x 183272x 176961x 176961x 125894x 125894x 176961x 183272x 183272x 183272x 183272x 162353x 162353x 183272x 183272x 183272x 259x 259x 183272x 183272x 183272x 319x 183272x 2638x 182953x 650x 650x 650x 276x 650x 180x 374x 178x 194x 11x 16x 5x 5x 180315x 81x 179665x 62716x 28793x 62716x 238x   238x   238x 187x 238x 51x 51x 33923x 6020x 984x 6020x 431x 5036x 2493x 4605x 2112x 2112x 33685x 238x 151x 238x 36x 87x 46x 51x 5x 5x 27665x 6022x 3392x 6022x 72x 2630x 2539x 2558x 19x 19x 27427x 3988x 45x 3988x 22x 3943x 10x 3921x 3911x 3911x 21405x 269x 167x 269x 32x 102x 2x 70x 68x 68x 17417x 913x   913x 899x 913x   14x 14x 14x 913x 179584x 11465x 478x   478x 1x 478x   477x 477x 
477x 11465x 465x 2x 465x   463x   463x 463x 463x 465x 11465x 183272x 183272x 132160x 132160x 183272x 183272x 285623x 285623x 1x 1x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 9088x 973584x 973584x 973584x 973584x 973584x 973584x 946248x 251049x 946248x 2483x 2483x 2483x 695199x 649x 649x 649x 692716x 155x 155x 155x 692067x 81x 81x 81x 691912x 691831x 314x 314x 314x 691831x 901x 691517x 690616x 465x 690616x 690151x 690151x 920x 920x 690151x 689231x 689231x 15914x 15914x 973584x 77x 77x 77x 27336x 27259x 27259x 27259x 27259x 27259x 155x 155x 155x 1x 155x 154x 154x 27259x 27104x 27104x 27104x 649x 649x 649x 27104x 26455x 26455x 1x 26455x 26454x 26454x 26454x 26454x 26454x 2476x 2476x 2476x 4x 2476x 2472x 2472x 26454x 246x 246x 23978x     973584x 973584x 9088x 9088x 973584x 9088x 9088x 9088x 1x 1x
import {IFile} from "../../files/_ifile";
import {Position} from "../../position";
import {VirtualPosition} from "../../virtual_position";
import {AbstractToken} from "./tokens/abstract_token";
import {IABAPLexerResult} from "./lexer_result";
import {At, AtW, BracketLeft, BracketLeftW, BracketRight, BracketRightW, Comment, Dash, DashW, Identifier, InstanceArrow, InstanceArrowW, ParenLeft, ParenLeftW, ParenRight, ParenRightW, Plus, PlusW, Pragma, Punctuation, StaticArrow, StaticArrowW, StringTemplate, StringTemplateBegin, StringTemplateEnd, StringTemplateMiddle, StringToken, WAt, WAtW, WBracketLeft, WBracketLeftW, WBracketRight, WBracketRightW, WDash, WDashW, WInstanceArrow, WInstanceArrowW, WParenLeft, WParenLeftW, WParenRight, WParenRightW, WPlus, WPlusW, WStaticArrow, WStaticArrowW} from "./tokens";
import {LexerBuffer} from "./lexer_buffer";
import {LexerStream} from "./lexer_stream";
 
// Lexer states. The active state decides where the character buffer is cut
// and which token class the buffered text becomes.
const ModeNormal = 1;   // regular source text
const ModePing = 2;     // entered when a backtick (`) is coming up
const ModeStr = 3;      // entered when a single quote (') is coming up
const ModeTemplate = 4; // entered when "|" or "}" is coming up
const ModeComment = 5;  // entered on a double quote, or "*" right after a newline
const ModePragma = 6;   // entered when "##" is coming up
 
/** Constructor shape shared by every token class the lexer instantiates. */
type TokenConstructor = new (pos: Position, str: string) => AbstractToken;

/**
 * The four whitespace-sensitive flavours of one operator token, ordered as
 * [plain, whitespace after, whitespace before, whitespace on both sides].
 */
type TokenVariants = readonly [TokenConstructor, TokenConstructor, TokenConstructor, TokenConstructor];

/** In normal mode the buffer is flushed when the NEXT character is one of these. */
const NormalSplits: ReadonlySet<string> = new Set([" ", ":", ".", ",", "-", "+", "(", ")", "[", "]", "\t", "\n"]);

/** In normal mode a buffer consisting of exactly one of these characters is flushed immediately. */
const NormalStandalone: ReadonlySet<string> = new Set([".", ",", ":", "(", ")", "[", "]", "+", "@"]);

/**
 * Character-driven tokenizer.
 *
 * Characters are appended to a buffer one at a time; a small state machine
 * (the `Mode*` constants) decides when the buffer is flushed into a token and
 * which token class is used. An instance keeps per-run state in its fields,
 * all of which are reset by `run()` / `process()`.
 */
export class Lexer {

  private virtual: Position | undefined;
  private tokens: AbstractToken[];
  private m: number;
  private stream: LexerStream;
  private buffer: LexerBuffer;

  /**
   * Tokenizes the raw contents of `file`.
   *
   * @param file - file whose `getRaw()` text is lexed
   * @param virtual - when given, every token position is created as a
   *   `VirtualPosition` based on this position instead of a plain `Position`
   * @returns the input file together with the tokens found, in source order
   */
  public run(file: IFile, virtual?: Position): IABAPLexerResult {
    this.virtual = virtual;
    this.tokens = [];
    this.m = ModeNormal;

    this.process(file.getRaw());
    return {file, tokens: this.tokens};
  }

  /**
   * Flushes the buffer: if it holds anything besides whitespace a token is
   * appended to the result; the buffer is cleared either way.
   */
  private add() {
    const s = this.buffer.get().trim();
    if (s.length > 0) {
      this.tokens.push(this.createToken(s));
    }
    this.buffer.clear();
  }

  /**
   * Builds the token for the trimmed buffer text `s`, based on the current
   * mode and on the characters directly before and after the text.
   */
  private createToken(s: string): AbstractToken {
    const col = this.stream.getCol();
    const row = this.stream.getRow();

    // The stream points at the last buffered character, so the character in
    // front of the token sits s.length positions back. A token starting at the
    // very beginning of the input has no predecessor and counts as "no white".
    // NOTE(review): `s` is trimmed on both sides; should the buffer ever end in
    // whitespace, this offset and the column below would be shifted - confirm.
    const before = this.stream.getOffset() - s.length;
    const prev = before >= 0 ? this.stream.getRaw().charAt(before) : "";
    const whiteBefore = prev === " " || prev === "\n" || prev === "\t" || prev === ":";

    // End of input ("") and the characters that terminate or chain statements
    // are treated like whitespace after the token.
    const next = this.stream.nextChar();
    const whiteAfter = next === " " || next === "\n" || next === "\t" || next === ":"
      || next === "," || next === "." || next === "" || next === "\"";

    let pos = new Position(row, col - s.length);
    if (this.virtual) {
      pos = new VirtualPosition(this.virtual, pos.getRow(), pos.getCol());
    }

    if (this.m === ModeComment) {
      return new Comment(pos, s);
    }
    if (this.m === ModePing || this.m === ModeStr) {
      return new StringToken(pos, s);
    }
    if (this.m === ModeTemplate) {
      return Lexer.createTemplateToken(pos, s, whiteBefore, whiteAfter);
    }
    if (s.length > 2 && s.startsWith("##")) {
      return new Pragma(pos, s);
    }
    if (s === "." || s === ",") {
      return new Punctuation(pos, s);
    }

    const variants = Lexer.whitespaceVariants(s);
    if (variants !== undefined) {
      // index bit 1 = whitespace before, bit 0 = whitespace after
      const Variant = variants[(whiteBefore ? 2 : 0) + (whiteAfter ? 1 : 0)];
      return new Variant(pos, s);
    }

    return new Identifier(pos, s);
  }

  /**
   * Classifies a piece of a string template by its first and last character;
   * anything that does not match a template shape becomes an Identifier.
   */
  private static createTemplateToken(pos: Position, s: string, whiteBefore: boolean, whiteAfter: boolean): AbstractToken {
    const first = s.charAt(0);
    const last = s.charAt(s.length - 1);
    if (first === "|" && last === "|") {
      return new StringTemplate(pos, s);
    } else if (first === "|" && last === "{" && whiteAfter) {
      return new StringTemplateBegin(pos, s);
    } else if (first === "}" && last === "|" && whiteBefore) {
      return new StringTemplateEnd(pos, s);
    } else if (first === "}" && last === "{" && whiteAfter && whiteBefore) {
      return new StringTemplateMiddle(pos, s);
    }
    return new Identifier(pos, s);
  }

  /**
   * Returns the token classes for operators whose class depends on the
   * surrounding whitespace, or undefined when `s` is not such an operator.
   */
  private static whitespaceVariants(s: string): TokenVariants | undefined {
    switch (s) {
      case "[": return [BracketLeft, BracketLeftW, WBracketLeft, WBracketLeftW];
      case "(": return [ParenLeft, ParenLeftW, WParenLeft, WParenLeftW];
      case "]": return [BracketRight, BracketRightW, WBracketRight, WBracketRightW];
      case ")": return [ParenRight, ParenRightW, WParenRight, WParenRightW];
      case "-": return [Dash, DashW, WDash, WDashW];
      case "+": return [Plus, PlusW, WPlus, WPlusW];
      case "@": return [At, AtW, WAt, WAtW];
      case "->": return [InstanceArrow, InstanceArrowW, WInstanceArrow, WInstanceArrowW];
      case "=>": return [StaticArrow, StaticArrowW, WStaticArrow, WStaticArrowW];
      default: return undefined;
    }
  }

  /**
   * Runs the state machine over `raw` (with all "\r" removed), flushing the
   * buffer into tokens as it goes. The order of the branches below is
   * significant: the first matching condition wins.
   */
  private process(raw: string) {
    this.stream = new LexerStream(raw.replace(/\r/g, ""));
    this.buffer = new LexerBuffer();

    for (;;) {
      const current = this.stream.currentChar();
      const buf = this.buffer.add(current);
      const ahead = this.stream.nextChar();
      // compared against two-character strings below ("##", "->", ...)
      const aahead = this.stream.nextNextChar();

      if (this.m === ModeNormal) {
        if (NormalSplits.has(ahead)) {
          this.add();
        } else if (ahead === "'") {
          // start string
          this.add();
          this.m = ModeStr;
        } else if (ahead === "|" || ahead === "}") {
          // start template
          this.add();
          this.m = ModeTemplate;
        } else if (ahead === "`") {
          // start ping
          this.add();
          this.m = ModePing;
        } else if (aahead === "##") {
          // start pragma
          this.add();
          this.m = ModePragma;
        } else if (ahead === "\""
            || (ahead === "*" && current === "\n")) {
          // start comment: a double quote anywhere, or "*" directly after a newline
          this.add();
          this.m = ModeComment;
        } else if (ahead === "@" && buf.trim().length === 0) {
          // "@" coming up while only whitespace is buffered
          this.add();
        } else if (aahead === "->"
            || aahead === "=>") {
          // an arrow follows: flush what precedes it
          this.add();
        } else if (current === ">"
            && ahead !== " "
            && (this.stream.prevChar() === "-" || this.stream.prevChar() === "=")) {
          // arrows: the ">" just buffered completes "->" or "=>"
          this.add();
        } else if (buf.length === 1
            && (NormalStandalone.has(buf)
            || (buf === "-" && ahead !== ">"))) {
          // single-character token; a lone "-" only when it is not the start of "->"
          this.add();
        }
      } else if (this.m === ModePragma && (ahead === "," || ahead === ":" || ahead === "." || ahead === " " || ahead === "\n")) {
        // end of pragma
        this.add();
        this.m = ModeNormal;
      } else if (this.m === ModePing
          && buf.length > 1
          && current === "`"
          && aahead !== "``"
          && ahead !== "`"
          && this.buffer.countIsEven("`")) {
        // end of ping
        this.add();
        if (ahead === `"`) {
          this.m = ModeComment;
        } else {
          this.m = ModeNormal;
        }
      } else if (this.m === ModeTemplate
          && buf.length > 1
          && (current === "|" || current === "{")
          && (this.stream.prevChar() !== "\\" || this.stream.prevPrevChar() === "\\\\")) {
        // end of template: "|" or "{" that is not preceded by a single backslash
        this.add();
        this.m = ModeNormal;
      } else if (this.m === ModeTemplate
          && ahead === "}"
          && current !== "\\") {
        // "}" coming up inside a template: flush the embedded source first
        this.add();
      } else if (this.m === ModeStr
          && current === "'"
          && buf.length > 1
          && aahead !== "''"
          && ahead !== "'"
          && this.buffer.countIsEven("'")) {
        // end of string
        this.add();
        if (ahead === "\"") {
          this.m = ModeComment;
        } else {
          this.m = ModeNormal;
        }
      } else if (ahead === "\n" && this.m !== ModeTemplate) {
        // a newline ends whatever is buffered in every mode except templates
        this.add();
        this.m = ModeNormal;
      } else if (this.m === ModeTemplate && current === "\n") {
        this.add();
      }

      if (!this.stream.advance()) {
        break;
      }
    }

    // flush whatever is left at end of input
    this.add();
  }

}