All files / src/abap/1_lexer lexer.ts

96.19% Statements 303/315
94.38% Branches 185/196
100% Functions 4/4
96.19% Lines 303/315

Press n or j to go to the next uncovered block, b, p or k for the previous block.

1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 3151x 1x 1x 1x 1x 1x 1x 1x 1x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 240948x 240948x 154745x 154745x 154745x 154745x 154745x 149304x 149304x 106306x 106306x 149304x 154745x 154745x 154745x 154745x 138025x 138025x 154745x 154745x 154745x 204x 204x 154745x 154745x 154745x 288x 154745x 2415x 154457x 601x 601x 601x 271x 601x 160x 330x 158x 170x 7x 12x 5x 5x 152042x 74x 151441x 53821x 25012x 53821x 176x   176x   176x 135x 176x 41x 41x 28809x 4939x 888x 4939x 344x 4051x 2091x 3707x 1616x 1616x 28633x 176x 100x 176x 35x 76x 41x 41x     23694x 4941x 2897x 4941x 68x 2044x 1960x 1976x 16x 16x 23518x 3316x 40x 3316x 16x 3276x 9x 3260x 3251x 3251x 18577x 224x 151x 224x 18x 73x 1x 55x 54x 54x 15261x 421x   421x 407x 421x   14x 14x 14x 421x 151367x 
9442x 421x   421x 1x 421x   420x 420x 420x 9442x 422x 2x 422x   420x   420x 420x 420x 422x 9442x 154745x 154745x 111319x 111319x 154745x 154745x 240948x 240948x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 7853x 820308x 820308x 820308x 820308x 820308x 820308x 795410x 211803x 795410x 2260x 2260x 2260x 583607x 600x 600x 600x 581347x 155x 155x 155x 580747x 74x 74x 74x 580592x 580518x 283x 283x 283x 580518x 409x 580235x 579826x 422x 579826x 579404x 579404x 821x 821x 579404x 578583x 578583x 12962x 12962x 820308x 70x 70x 70x 24898x 24828x 24828x 24828x 24828x 24828x 155x 155x 155x 1x 155x 154x 154x 24828x 24673x 24673x 24673x 600x 600x 600x 24673x 24073x 24073x 1x 24073x 24072x 24072x 24072x 24072x 24072x 2253x 2253x 2253x 4x 2253x 2249x 2249x 24072x 227x 227x 21819x     820308x 820308x 7853x 7853x 820308x 7853x 7853x 7853x 7853x 7853x
import {IFile} from "../../files/_ifile";
import {Position} from "../../position";
import {VirtualPosition} from "../../virtual_position";
import {AbstractToken} from "./tokens/abstract_token";
import {IABAPLexerResult} from "./lexer_result";
import {At, AtW, BracketLeft, BracketLeftW, BracketRight, BracketRightW, Comment, Dash, DashW, Identifier, InstanceArrow, InstanceArrowW, ParenLeft, ParenLeftW, ParenRight, ParenRightW, Plus, PlusW, Pragma, Punctuation, StaticArrow, StaticArrowW, StringTemplate, StringTemplateBegin, StringTemplateEnd, StringTemplateMiddle, StringToken, WAt, WAtW, WBracketLeft, WBracketLeftW, WBracketRight, WBracketRightW, WDash, WDashW, WInstanceArrow, WInstanceArrowW, WParenLeft, WParenLeftW, WParenRight, WParenRightW, WPlus, WPlusW, WStaticArrow, WStaticArrowW} from "./tokens";
import {LexerBuffer} from "./lexer_buffer";
import {LexerStream} from "./lexer_stream";
 
/**
 * Character-driven lexer for ABAP source.
 *
 * `run()` walks the raw file content one character at a time, accumulating
 * characters in a buffer and flushing the buffer into a token whenever a
 * token boundary is detected. A small mode variable tracks whether the lexer
 * is currently inside normal code, a string, a string template, a comment or
 * a pragma.
 */
export class Lexer {
  // Lexer modes; `m` holds exactly one of these values at any time.
  private readonly ModeNormal: number = 1;
  private readonly ModePing: number = 2;      // inside a backtick-delimited string
  private readonly ModeStr: number = 3;       // inside a single-quote-delimited string
  private readonly ModeTemplate: number = 4;  // inside a string template, started at "|" or "}"
  private readonly ModeComment: number = 5;
  private readonly ModePragma: number = 6;    // inside a "##" pragma

  // Optional base position; when set, tokens get a VirtualPosition built on it.
  private virtual: Position | undefined;
  private tokens: AbstractToken[];
  private m: number;
  private stream: LexerStream;
  private buffer: LexerBuffer;

  /**
   * Lexes the given file and returns the file together with its tokens.
   *
   * @param file - file whose raw content is tokenized
   * @param virtual - optional position; when given, every token position is
   *   wrapped in a VirtualPosition relative to it
   * @returns the input file and the list of tokens produced
   */
  public run(file: IFile, virtual?: Position): IABAPLexerResult {
    this.virtual = virtual;
    this.tokens = [];
    this.m = this.ModeNormal;

    this.process(file.getRaw());
    return {file, tokens: this.tokens};
  }

  /**
   * Flushes the buffer: if its trimmed content is non-empty, a token is
   * created for it and appended to `tokens`. The buffer is always cleared,
   * so calling this with a whitespace-only buffer just discards it.
   */
  private add() {
    const s = this.buffer.get().trim();
    if (s.length > 0) {
      const col = this.stream.getCol();
      const row = this.stream.getRow();

      // The character immediately preceding the token text in the raw source.
      let whiteBefore = false;
      const beforeOffset = this.stream.getOffset() - s.length;
      if (beforeOffset >= 0) {
        const prev = this.stream.getRaw().charAt(beforeOffset);
        if (prev === " " || prev === "\n" || prev === "\t" || prev === ":") {
          whiteBefore = true;
        }
      }

      // The character following the token text. Besides real whitespace, a
      // few delimiters and the empty string (presumably end of input) count
      // as "white" here.
      let whiteAfter = false;
      const next = this.stream.nextChar();
      if (next === " " || next === "\n" || next === "\t" || next === ":" || next === "," || next === "." || next === "" || next === "\"") {
        whiteAfter = true;
      }

      let pos = new Position(row, col - s.length);
      if (this.virtual) {
        pos = new VirtualPosition(this.virtual, pos.getRow(), pos.getCol());
      }

      this.tokens.push(this.createToken(pos, s, whiteBefore, whiteAfter));
    }
    this.buffer.clear();
  }

  /**
   * Chooses the token class for `s` based on the current mode, the text
   * itself, and the whitespace surrounding it.
   *
   * @param pos - position assigned to the token
   * @param s - trimmed, non-empty token text
   * @param whiteBefore - whether the text is preceded by whitespace (or ":")
   * @param whiteAfter - whether the text is followed by whitespace or a delimiter
   * @returns the new token; falls back to Identifier when nothing else matches
   */
  private createToken(pos: Position, s: string, whiteBefore: boolean, whiteAfter: boolean): AbstractToken {
    if (this.m === this.ModeComment) {
      return new Comment(pos, s);
    }
    if (this.m === this.ModePing || this.m === this.ModeStr) {
      return new StringToken(pos, s);
    }
    if (this.m === this.ModeTemplate) {
      return this.createTemplateToken(pos, s, whiteBefore, whiteAfter);
    }
    // A bare "##" (length 2) is deliberately not a pragma.
    if (s.length > 2 && s.substring(0, 2) === "##") {
      return new Pragma(pos, s);
    }

    // Exact matches only, so the one- and two-character symbols cannot
    // collide with each other or with longer text.
    let variant: (new (pos: Position, s: string) => AbstractToken) | undefined = undefined;
    switch (s) {
      case ".":
      case ",":
        return new Punctuation(pos, s);
      case "[":
        variant = Lexer.pickVariant(whiteBefore, whiteAfter, WBracketLeftW, WBracketLeft, BracketLeftW, BracketLeft);
        break;
      case "(":
        variant = Lexer.pickVariant(whiteBefore, whiteAfter, WParenLeftW, WParenLeft, ParenLeftW, ParenLeft);
        break;
      case "]":
        variant = Lexer.pickVariant(whiteBefore, whiteAfter, WBracketRightW, WBracketRight, BracketRightW, BracketRight);
        break;
      case ")":
        variant = Lexer.pickVariant(whiteBefore, whiteAfter, WParenRightW, WParenRight, ParenRightW, ParenRight);
        break;
      case "-":
        variant = Lexer.pickVariant(whiteBefore, whiteAfter, WDashW, WDash, DashW, Dash);
        break;
      case "+":
        variant = Lexer.pickVariant(whiteBefore, whiteAfter, WPlusW, WPlus, PlusW, Plus);
        break;
      case "@":
        variant = Lexer.pickVariant(whiteBefore, whiteAfter, WAtW, WAt, AtW, At);
        break;
      case "->":
        variant = Lexer.pickVariant(whiteBefore, whiteAfter, WInstanceArrowW, WInstanceArrow, InstanceArrowW, InstanceArrow);
        break;
      case "=>":
        variant = Lexer.pickVariant(whiteBefore, whiteAfter, WStaticArrowW, WStaticArrow, StaticArrowW, StaticArrow);
        break;
      default:
        break;
    }

    if (variant === undefined) {
      return new Identifier(pos, s);
    }
    return new variant(pos, s);
  }

  /**
   * Classifies a piece of string-template text by its first and last
   * character: "|...|" is a complete template, "|...{" a begin, "}...|" an
   * end and "}...{" a middle part. The begin/end/middle forms additionally
   * require whitespace on the side facing the embedded expression; anything
   * else becomes an Identifier.
   */
  private createTemplateToken(pos: Position, s: string, whiteBefore: boolean, whiteAfter: boolean): AbstractToken {
    const first = s.charAt(0);
    const last = s.charAt(s.length - 1);

    if (first === "|" && last === "|") {
      return new StringTemplate(pos, s);
    }
    if (first === "|" && last === "{" && whiteAfter === true) {
      return new StringTemplateBegin(pos, s);
    }
    if (first === "}" && last === "|" && whiteBefore === true) {
      return new StringTemplateEnd(pos, s);
    }
    if (first === "}" && last === "{" && whiteAfter === true && whiteBefore === true) {
      return new StringTemplateMiddle(pos, s);
    }
    return new Identifier(pos, s);
  }

  /**
   * Selects one of the four whitespace-sensitive variants of a symbol token.
   * The classes are only selected here, not instantiated.
   *
   * @param whiteBefore - whitespace precedes the symbol
   * @param whiteAfter - whitespace follows the symbol
   * @param both - class used when whitespace is on both sides (W...W)
   * @param before - class used when whitespace is only before (W...)
   * @param after - class used when whitespace is only after (...W)
   * @param neither - class used when there is no surrounding whitespace
   * @returns the matching token class
   */
  private static pickVariant(
    whiteBefore: boolean,
    whiteAfter: boolean,
    both: new (pos: Position, s: string) => AbstractToken,
    before: new (pos: Position, s: string) => AbstractToken,
    after: new (pos: Position, s: string) => AbstractToken,
    neither: new (pos: Position, s: string) => AbstractToken
  ): new (pos: Position, s: string) => AbstractToken {
    if (whiteBefore === true && whiteAfter === true) {
      return both;
    } else if (whiteBefore === true) {
      return before;
    } else if (whiteAfter === true) {
      return after;
    }
    return neither;
  }

  /**
   * Main loop: feeds `raw` (with carriage returns removed) through the
   * stream one character at a time, appending each character to the buffer
   * and deciding, from the current mode and the surrounding characters,
   * whether the buffer must be flushed and whether the mode changes.
   * The branch order below is significant.
   *
   * @param raw - raw file content
   */
  private process(raw: string) {
    this.stream = new LexerStream(raw.replace(/\r/g, ""));
    this.buffer = new LexerBuffer();

    // In normal mode, the buffer is flushed when one of these comes next.
    const splits: {[name: string]: boolean} = {
      " ": true,
      ":": true,
      ".": true,
      ",": true,
      "-": true,
      "+": true,
      "(": true,
      ")": true,
      "[": true,
      "]": true,
      "\t": true,
      "\n": true,
    };

    // In normal mode, a buffer consisting of exactly one of these is flushed
    // immediately as its own token.
    const bufs: {[name: string]: boolean} = {
      ".": true,
      ",": true,
      ":": true,
      "(": true,
      ")": true,
      "[": true,
      "]": true,
      "+": true,
      "@": true,
    };

    for (;;) {
      const current = this.stream.currentChar();
      // Value returned by LexerBuffer.add; used below as the buffer text
      // accumulated so far, including `current`.
      const buf = this.buffer.add(current);
      const ahead = this.stream.nextChar();
      // Compared against two-character strings below.
      const aahead = this.stream.nextNextChar();

      if (this.m === this.ModeNormal) {
        if (splits[ahead]) {
          this.add();
        } else if (ahead === "'") {
          // start string
          this.add();
          this.m = this.ModeStr;
        } else if (ahead === "|" || ahead === "}") {
          // start template
          this.add();
          this.m = this.ModeTemplate;
        } else if (ahead === "`") {
          // start ping
          this.add();
          this.m = this.ModePing;
        } else if (aahead === "##") {
          // start pragma
          this.add();
          this.m = this.ModePragma;
        } else if (ahead === "\""
            || (ahead === "*" && current === "\n")) {
          // start comment: a double quote anywhere, or "*" right after a newline
          this.add();
          this.m = this.ModeComment;
        } else if (ahead === "@" && buf.trim().length === 0) {
          // only whitespace buffered before "@": discard it
          this.add();
        } else if (aahead === "->"
            || aahead === "=>") {
          // an arrow is coming up: flush what precedes it
          this.add();
        } else if (current === ">"
            && ahead !== " "
            && (this.stream.prevChar() === "-" || this.stream.prevChar() === "=")) {
          // arrows: flush once the ">" completing "->" or "=>" is buffered
          this.add();
        } else if (buf.length === 1
            && (bufs[buf]
            || (buf === "-" && ahead !== ">"))) {
          // single-character token; "-" only when it does not start "->"
          this.add();
        }
      } else if (this.m === this.ModePragma && (ahead === "," || ahead === ":" || ahead === "." || ahead === " " || ahead === "\n")) {
        // end of pragma
        this.add();
        this.m = this.ModeNormal;
      } else if (this.m === this.ModePing
          && buf.length > 1
          && current === "`"
          && aahead !== "``"
          && ahead !== "`"
          && this.buffer.countIsEven("`")) {
        // end of ping
        this.add();
        if (ahead === `"`) {
          this.m = this.ModeComment;
        } else {
          this.m = this.ModeNormal;
        }
      } else if (this.m === this.ModeTemplate
          && buf.length > 1
          && (current === "|" || current === "{")
          && (this.stream.prevChar() !== "\\" || this.stream.prevPrevChar() === "\\\\")) {
        // end of template: "|" or "{" that is not preceded by a single
        // backslash (a preceding double backslash does not prevent the end)
        this.add();
        this.m = this.ModeNormal;
      } else if (this.m === this.ModeTemplate
          && ahead === "}"
          && current !== "\\") {
        // "}" not preceded by a backslash is next: flush, stay in template mode
        this.add();
      } else if (this.m === this.ModeStr
          && current === "'"
          && buf.length > 1
          && aahead !== "''"
          && ahead !== "'"
          && this.buffer.countIsEven("'")) {
        // end of string
        this.add();
        if (ahead === "\"") {
          this.m = this.ModeComment;
        } else {
          this.m = this.ModeNormal;
        }
      } else if (ahead === "\n" && this.m !== this.ModeTemplate) {
        // end of line terminates every remaining mode except template
        this.add();
        this.m = this.ModeNormal;
      } else if (this.m === this.ModeTemplate && current === "\n") {
        // newline inside a template: flush, stay in template mode
        this.add();
      }

      if (!this.stream.advance()) {
        break;
      }
    }

    // Flush whatever is left after the last character.
    this.add();
  }

}