All files / src/abap/1_lexer lexer.ts

97.24% Statements 318/327
95.65% Branches 198/207
100% Functions 3/3
97.24% Lines 318/327

Press n or j to go to the next uncovered block, b, p or k for the previous block.

1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 3271x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 1x 1x 345140x 345140x 209025x 209025x 209025x 209025x 209025x 201365x 201365x 143615x 143615x 201365x 209025x 209025x 209025x 209025x 183776x 183776x 209025x 209025x 209025x 259x 259x 209025x 209025x 209025x 320x 209025x 2799x 208705x 652x 652x 652x 276x 652x 181x 376x 179x 195x 11x 16x 5x 5x 205906x 81x 205254x 71542x 31190x 71542x 289x 6x 289x   283x 232x 283x 51x 51x 40352x 7102x 1206x 7102x 471x 5896x 2872x 5425x 2553x 2553x 40063x 289x 176x 289x 62x 113x 46x 51x 5x 5x 32961x 7104x 3984x 7104x 80x 3120x 3000x 3040x 40x 40x 32672x 4299x 93x 4299x 30x 4206x 10x 4176x 4166x 4166x 25568x 464x 185x 464x 206x 279x 2x 73x 71x 71x 21269x 2438x   2438x 2424x 2438x   14x 
14x 14x 2438x 205173x 13584x 536x   536x 1x 536x   535x 535x 535x 13584x 474x 2x 474x   472x   472x 472x 472x 474x 13584x 209025x 209025x 326x 326x 326x 326x 326x 205x 205x 326x 209025x 209025x 150783x 150783x 209025x 209025x 345140x 345140x 1x 1x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 10471x 1117684x 1117684x 1117684x 1117684x 1117684x 1117684x 1089492x 303500x 1089492x 2642x 2642x 2642x 785992x 651x 651x 651x 783350x 157x 157x 157x 782699x 81x 81x 81x 782542x 782461x 315x 315x 315x 782461x 2426x 782146x 779720x 474x 779720x 779246x 779246x 953x 953x 779246x 778293x 778293x 19702x 19702x 1117684x 77x 77x 77x 28192x 28115x 28115x 28115x 28115x 28115x 157x 157x 157x 1x 157x 156x 156x 28115x 27958x 27958x 27958x 651x 651x 651x 27958x 27307x 27307x 1x 27307x 27306x 27306x 27306x 27306x 27306x 2635x 2635x 2635x 4x 2635x 2631x 2631x 27306x 247x 247x 24671x     1117684x 1117684x 10471x 10471x 1117684x 10471x 10471x 10471x 1x 1x
import {IFile} from "../../files/_ifile";
import {Position} from "../../position";
import {VirtualPosition} from "../../virtual_position";
import {AbstractToken} from "./tokens/abstract_token";
import {IABAPLexerResult} from "./lexer_result";
import {At, AtW, AssociationName, BracketLeft, BracketLeftW, BracketRight, BracketRightW, Comment, Dash, DashW, Identifier, InstanceArrow, InstanceArrowW, ParenLeft, ParenLeftW, ParenRight, ParenRightW, Plus, PlusW, Pragma, Punctuation, StaticArrow, StaticArrowW, StringTemplate, StringTemplateBegin, StringTemplateEnd, StringTemplateMiddle, StringToken, WAt, WAtW, WBracketLeft, WBracketLeftW, WBracketRight, WBracketRightW, WDash, WDashW, WInstanceArrow, WInstanceArrowW, WParenLeft, WParenLeftW, WParenRight, WParenRightW, WPlus, WPlusW, WStaticArrow, WStaticArrowW} from "./tokens";
import {LexerBuffer} from "./lexer_buffer";
import {LexerStream} from "./lexer_stream";
 
// Lexer modes: the value of Lexer.m decides how the characters currently being buffered are
// classified when a token is emitted.

// Default mode; set at the start of run() and restored when a string, ping, template or pragma ends.
const ModeNormal: number = 1;
// Entered from normal mode when the next character is a backtick; tokens are emitted as StringToken.
const ModePing: number = 2;
// Entered from normal mode when the next character is a single quote; tokens are emitted as StringToken.
const ModeStr: number = 3;
// Entered from normal mode when the next character is "|" or "}"; tokens are emitted as string template parts.
const ModeTemplate: number = 4;
// Entered on a double quote, or on "*" directly after a newline; left again at the next newline.
const ModeComment: number = 5;
// Entered from normal mode when the two-character lookahead is "##"; ends at "," ":" "." " " or newline.
const ModePragma: number = 6;
 
/** Constructor shape shared by every token class the lexer instantiates. */
type TokenConstructor = new (pos: Position, raw: string) => AbstractToken;

/**
 * Token classes for one piece of text, ordered as: whitespace on both sides,
 * whitespace before only, whitespace after only, no surrounding whitespace.
 */
type WhitespaceVariants = readonly [TokenConstructor, TokenConstructor, TokenConstructor, TokenConstructor];

/**
 * Character-driven lexer: walks the raw file contents one character at a time, collects
 * characters in a buffer and, depending on the current mode and the lookahead, turns the
 * buffer into a token.
 *
 * The instance keeps the state of the current run in its fields, so a single instance
 * must not be used for overlapping runs.
 */
export class Lexer {

  /** In normal mode the buffer is flushed when the NEXT character is one of these. */
  private static readonly SPLITS: ReadonlySet<string> = new Set([
    " ", ":", ".", ",", "-", "+", "(", ")", "[", "]", "\\", "\t", "\n",
  ]);

  /** In normal mode a buffer consisting of exactly one of these characters is flushed immediately. */
  private static readonly SINGLE_CHAR_TOKENS: ReadonlySet<string> = new Set([
    ".", ",", ":", "(", ")", "[", "]", "+", "@",
  ]);

  /** Token text whose token class depends on the whitespace around it. */
  private static readonly WHITESPACE_VARIANTS: ReadonlyMap<string, WhitespaceVariants> = new Map<string, WhitespaceVariants>([
    ["[", [WBracketLeftW, WBracketLeft, BracketLeftW, BracketLeft]],
    ["(", [WParenLeftW, WParenLeft, ParenLeftW, ParenLeft]],
    ["]", [WBracketRightW, WBracketRight, BracketRightW, BracketRight]],
    [")", [WParenRightW, WParenRight, ParenRightW, ParenRight]],
    ["-", [WDashW, WDash, DashW, Dash]],
    ["+", [WPlusW, WPlus, PlusW, Plus]],
    ["@", [WAtW, WAt, AtW, At]],
    ["->", [WInstanceArrowW, WInstanceArrow, InstanceArrowW, InstanceArrow]],
    ["=>", [WStaticArrowW, WStaticArrow, StaticArrowW, StaticArrow]],
  ]);

  private virtual: Position | undefined;
  private tokens: AbstractToken[];
  private m: number;
  private stream: LexerStream;
  private buffer: LexerBuffer;

  /**
   * Lexes the raw contents of a file.
   *
   * @param file - file whose raw contents are tokenized
   * @param virtual - when given, every token position is wrapped in a VirtualPosition based on it
   * @returns the input file together with the tokens found, in source order
   */
  public run(file: IFile, virtual?: Position): IABAPLexerResult {
    this.virtual = virtual;
    this.tokens = [];
    this.m = ModeNormal;

    this.process(file.getRaw());
    return {file, tokens: this.tokens};
  }

  /** Characters that count as whitespace when found directly in front of a token. */
  private static isWhiteBefore(char: string): boolean {
    return char === " " || char === "\n" || char === "\t" || char === ":";
  }

  /** Characters (or end of input, seen as "") that count as whitespace directly after a token. */
  private static isWhiteAfter(char: string): boolean {
    return char === " " || char === "\n" || char === "\t" || char === ":"
      || char === "," || char === "." || char === "" || char === "\"";
  }

  /** Classifies a chunk collected in template mode; anything unrecognized becomes an Identifier. */
  private static createTemplateToken(s: string, pos: Position, whiteBefore: boolean, whiteAfter: boolean): AbstractToken {
    const first = s.charAt(0);
    const last = s.charAt(s.length - 1);
    if (first === "|" && last === "|") {
      return new StringTemplate(pos, s);
    } else if (first === "|" && last === "{" && whiteAfter) {
      return new StringTemplateBegin(pos, s);
    } else if (first === "}" && last === "|" && whiteBefore) {
      return new StringTemplateEnd(pos, s);
    } else if (first === "}" && last === "{" && whiteAfter && whiteBefore) {
      return new StringTemplateMiddle(pos, s);
    }
    return new Identifier(pos, s);
  }

  /**
   * Emits the trimmed buffer contents as a token (nothing is emitted when the trimmed
   * buffer is empty) and clears the buffer in either case.
   */
  private add(): void {
    const s = this.buffer.get().trim();
    if (s.length > 0) {
      const col = this.stream.getCol();
      const row = this.stream.getRow();

      // the character directly in front of the token, relative to the current stream offset
      const beforeOffset = this.stream.getOffset() - s.length;
      const whiteBefore = beforeOffset >= 0
        && Lexer.isWhiteBefore(this.stream.getRaw().charAt(beforeOffset));

      const whiteAfter = Lexer.isWhiteAfter(this.stream.nextChar());

      let pos = new Position(row, col - s.length);
      if (this.virtual) {
        pos = new VirtualPosition(this.virtual, pos.getRow(), pos.getCol());
      }

      this.tokens.push(this.createToken(s, pos, whiteBefore, whiteAfter));
    }
    this.buffer.clear();
  }

  /** Picks the token class for the text, based on the current mode and surrounding whitespace. */
  private createToken(s: string, pos: Position, whiteBefore: boolean, whiteAfter: boolean): AbstractToken {
    if (this.m === ModeComment) {
      return new Comment(pos, s);
    } else if (this.m === ModePing || this.m === ModeStr) {
      return new StringToken(pos, s);
    } else if (this.m === ModeTemplate) {
      return Lexer.createTemplateToken(s, pos, whiteBefore, whiteAfter);
    } else if (s.length > 2 && s.startsWith("##")) {
      return new Pragma(pos, s);
    } else if (s === "." || s === ",") {
      return new Punctuation(pos, s);
    }

    // keys are only one or two characters long, so longer text never matches
    const variants = Lexer.WHITESPACE_VARIANTS.get(s);
    if (variants !== undefined) {
      const [both, beforeOnly, afterOnly, neither] = variants;
      if (whiteBefore && whiteAfter) {
        return new both(pos, s);
      } else if (whiteBefore) {
        return new beforeOnly(pos, s);
      } else if (whiteAfter) {
        return new afterOnly(pos, s);
      }
      return new neither(pos, s);
    }

    if (this.m === ModeNormal && s.charAt(0) === "\\" && this.isAssociationName(s)) {
      return new AssociationName(pos, s);
    }
    return new Identifier(pos, s);
  }

  /**
   * Decides whether text starting with a backslash is an association name, which is the
   * case when the character in front of it is not whitespace (or there is none).
   */
  private isAssociationName(s: string): boolean {
    // NOTE(review): the offset is shifted by one when there is no next character;
    // presumably this compensates for the stream position at end of input - confirm against LexerStream
    const adj = this.stream.nextChar() === "" ? 1 : 0;
    const prevOffset = this.stream.getOffset() - s.length - adj;
    const prevChar = prevOffset >= 0 ? this.stream.getRaw().charAt(prevOffset) : "";
    return !Lexer.isWhiteBefore(prevChar);
  }

  /**
   * Main loop: strips carriage returns, then feeds the input through the mode state machine
   * one character at a time, emitting tokens via add(). The order of the branches matters,
   * the first matching condition wins.
   */
  private process(raw: string): void {
    this.stream = new LexerStream(raw.replace(/\r/g, ""));
    this.buffer = new LexerBuffer();

    for (;;) {
      const current = this.stream.currentChar();
      const buf = this.buffer.add(current);
      const ahead = this.stream.nextChar();
      // compared against two-character strings below, so presumably a two-character lookahead
      const aahead = this.stream.nextNextChar();

      if (this.m === ModeNormal) {
        if (Lexer.SPLITS.has(ahead)) {
          this.add();
        } else if (ahead === "'") {
          // start string
          this.add();
          this.m = ModeStr;
        } else if (ahead === "|" || ahead === "}") {
          // start template
          this.add();
          this.m = ModeTemplate;
        } else if (ahead === "`") {
          // start ping
          this.add();
          this.m = ModePing;
        } else if (aahead === "##") {
          // start pragma
          this.add();
          this.m = ModePragma;
        } else if (ahead === "\""
            || (ahead === "*" && current === "\n")) {
          // start comment
          this.add();
          this.m = ModeComment;
        } else if (ahead === "@" && buf.trim().length === 0) {
          this.add();
        } else if (aahead === "->"
            || aahead === "=>") {
          this.add();
        } else if (current === ">"
            && ahead !== " "
            && (this.stream.prevChar() === "-" || this.stream.prevChar() === "=")) {
          // arrows
          this.add();
        } else if (buf.length === 1
            && (Lexer.SINGLE_CHAR_TOKENS.has(buf)
            || (buf === "-" && ahead !== ">"))) {
          this.add();
        }
      } else if (this.m === ModePragma && (ahead === "," || ahead === ":" || ahead === "." || ahead === " " || ahead === "\n")) {
        // end of pragma
        this.add();
        this.m = ModeNormal;
      } else if (this.m === ModePing
          && buf.length > 1
          && current === "`"
          && aahead !== "``"
          && ahead !== "`"
          && this.buffer.countIsEven("`")) {
        // end of ping, a comment may follow directly
        this.add();
        if (ahead === "\"") {
          this.m = ModeComment;
        } else {
          this.m = ModeNormal;
        }
      } else if (this.m === ModeTemplate
          && buf.length > 1
          && (current === "|" || current === "{")
          && (this.stream.prevChar() !== "\\" || this.stream.prevPrevChar() === "\\\\")) {
        // end of template, unless the terminating character is escaped by a single backslash
        this.add();
        this.m = ModeNormal;
      } else if (this.m === ModeTemplate
          && ahead === "}"
          && current !== "\\") {
        this.add();
      } else if (this.m === ModeStr
          && current === "'"
          && buf.length > 1
          && aahead !== "''"
          && ahead !== "'"
          && this.buffer.countIsEven("'")) {
        // end of string, a comment may follow directly
        this.add();
        if (ahead === "\"") {
          this.m = ModeComment;
        } else {
          this.m = ModeNormal;
        }
      } else if (ahead === "\n" && this.m !== ModeTemplate) {
        // a newline ends whatever is being collected, except inside templates
        this.add();
        this.m = ModeNormal;
      } else if (this.m === ModeTemplate && current === "\n") {
        this.add();
      }

      if (!this.stream.advance()) {
        break;
      }
    }

    // flush whatever is left in the buffer at end of input
    this.add();
  }

}