Class: Ecu::LabelList::DcmLexer

Inherits:

Object

Object
Ecu::LabelList::DcmLexer

show all

Defined in: lib/ecu/interfaces/dcm/dcm_lexer.rb

Constant Summary collapse

# Keyword strings recognised by the lexer. KW_RE is built from this list.
KEYWORDS =

[
  "FUNKTIONEN", "FESTWERT", "FESTWERTEBLOCK", "KENNLINIE", "GRUPPENKENNLINIE", "FESTKENNLINIE",
  "KENNFELD", "GRUPPENKENNFELD", "FESTKENNFELD", "STUETZSTELLENVERTEILUNG",
  "FKT",
  "ST/X", "ST/Y", "WERT", "ST_TX/X", "ST_TX/Y", "TEXT",
  "FUNKTION",
  "EINHEIT_X", "EINHEIT_Y", "EINHEIT_W",
  "LANGNAME", "DISPLAYNAME",
  "END",
].freeze

# Literal header text; next_token reports a match as :HEADER.
HEADER =

"KONSERVIERUNG_FORMAT 2.0"

# One or more spaces or tabs. Line breaks are not included.
WHITESPACE =

%r{ [ \t]+ }x

# A line break: either CRLF or a bare LF. A lone CR does not match.
NEWLINE =

%r{ \r\n|\n }x

# A `*` and everything after it up to (not including) the end of the line.
COMMENT =

%r{ ^\*.*$ }x

# The `@` character; next_token reports a match as :DIMENSIONS_SEP.
DIMENSIONS_SEP =

%r{ @ }x

# Text enclosed in double quotes. The pattern has no escape mechanism, so the
# content cannot contain a double quote; it may contain line breaks.
QUOTED_TEXT =

%r{ "[^"]*" }x

# A letter followed by any number of letters, digits, underscores or dots.
IDENTIFIER =

%r{ [A-Za-z][A-Za-z0-9_\.]* }x

# A single 0, or a digit sequence that does not start with 0.
UNSIGNED_INT =

%r{ [0]|[1-9][0-9]* }x

# UNSIGNED_INT with an optional leading minus sign (a leading plus is not accepted).
INT =

%r{ [-]?#{UNSIGNED_INT} }x

# Exponent suffix of a float: e or E, an optional sign, then at least one digit.
FLOAT_EXP =

%r{ [eE][+-]?[0-9]+ }x

# A floating point literal with an optional sign. The alternatives are tried
# in the order listed, so the forms carrying an exponent come first.
FLOAT =

%r{
     [-+]?
     (?:
        #{UNSIGNED_INT}?[.][0-9]+#{FLOAT_EXP} |      # 1.23e10 or .45e3
        #{UNSIGNED_INT}          #{FLOAT_EXP} |      # 3e4
        #{UNSIGNED_INT}?[.][0-9]+             |      # 7.3 or .50
        #{UNSIGNED_INT} [.][0-9]*                    # 3.02 or 9.
     )
}x

# Any entry of KEYWORDS followed by a word boundary, so that a keyword is not
# matched when it is merely the prefix of a longer word.
KW_RE =

/#{Regexp.union(KEYWORDS.sort)}\b/

KW_TABLE =

Instance Attribute Summary collapse

#doc ⇒ Object readonly

Returns the value of attribute doc.

Instance Method Summary collapse

#initialize(doc) ⇒ DcmLexer constructor

A new instance of DcmLexer.
#lineno ⇒ Object
#next_token ⇒ Object
#quoted_value ⇒ Object

Extracts quoted-text content without surrounding quotes in a single allocation.
#token_value ⇒ Object

Constructor Details

#initialize(doc) ⇒ `DcmLexer`

Returns a new instance of DcmLexer.

# File 'lib/ecu/interfaces/dcm/dcm_lexer.rb', line 9

# Sets up the lexer for one document.
#
# Creates the StringScanner that tracks the read position and keeps a
# reference to the text itself for direct byte access.
#
# @param doc [String] the text to tokenize
def initialize(doc)
  @scan = StringScanner.new(doc)
  @doc  = doc
end

Instance Attribute Details

#doc ⇒ `Object` (readonly)

Returns the value of attribute doc.



8
9
10

# File 'lib/ecu/interfaces/dcm/dcm_lexer.rb', line 8

# Returns the text this lexer was constructed with.
def doc
  @doc
end

Instance Method Details

#lineno ⇒ `Object`

# File 'lib/ecu/interfaces/dcm/dcm_lexer.rb', line 84

# Reports a line number derived from the current scan position.
#
# The result is the number of "\n" characters already consumed, plus one
# when the scanner is in the middle of a line. Directly after a line break
# (and at the very start of the text) nothing is added, so the value at the
# start of the text is 0.
#
# @return [Integer]
def lineno
  consumed_breaks = @doc.byteslice(0, @scan.pos).count("\n")
  return consumed_breaks if @scan.beginning_of_line?

  consumed_breaks + 1
end

#next_token ⇒ `Object`

# File 'lib/ecu/interfaces/dcm/dcm_lexer.rb', line 48

# Consumes the next token from the scanner and returns its type.
#
# Leading spaces and tabs are skipped first. The token class is then chosen
# from the first byte at the scan position, so only patterns that can start
# with that byte are tried.
#
# When no pattern matches, exactly one character is consumed and
# :UNKNOWN_CHAR is returned. This also applies to an unterminated quote and a
# lone "\r": a failed match always advances the scanner and never yields the
# nil that signals end of input.
#
# @return [Symbol, nil] the token type (for keywords, the value KW_TABLE holds
#   for the matched text), or nil once the end of the text is reached
def next_token
  # This is a hot path during DCM parsing. Make sure to optimize
  # here as far as possible.

  @scan.skip(WHITESPACE)

  return if @scan.eos?

  case @doc.getbyte(@scan.pos)
  when 10, 13                                                 # \n \r
    return :NEWLINE if @scan.skip(NEWLINE)
  when 34                                                     # "
    return :QUOTED_TEXT if @scan.skip(QUOTED_TEXT)
  when 42                                                     # *
    return :COMMENT if @scan.skip(COMMENT)
  when 64                                                     # @
    return :DIMENSIONS_SEP if @scan.skip(DIMENSIONS_SEP)
  when 43, 45, 46, 48..57                                     # + - . 0-9
    # FLOAT must be tried first: INT would match only the leading digits of "1.5".
    return :FLOAT if @scan.skip(FLOAT)
    return :INT   if @scan.skip(INT)
  else
    # Keywords take precedence over the header text and plain identifiers.
    if (keyword = @scan.scan(KW_RE))
      return KW_TABLE[keyword]
    end
    return :HEADER     if @scan.skip(HEADER)
    return :IDENTIFIER if @scan.skip(IDENTIFIER)
  end

  # Nothing matched: consume one character so the caller always makes progress.
  @scan.getch
  :UNKNOWN_CHAR
end

#quoted_value ⇒ `Object`

Extracts quoted-text content without surrounding quotes in a single allocation.



80
81
82

# File 'lib/ecu/interfaces/dcm/dcm_lexer.rb', line 80

# Returns the most recent match with its first and last byte removed, sliced
# straight out of the scanned string so that only one String is allocated.
#
# NOTE(review): presumably called right after next_token returned
# :QUOTED_TEXT, so the stripped bytes are the surrounding quotes — confirm
# against the caller.
#
# @return [String] the matched text without its first and last byte
def quoted_value
  match_bytes   = @scan.matched_size
  content_start = @scan.pos - match_bytes + 1 # first byte after the opening quote
  @scan.string.byteslice(content_start, match_bytes - 2)
end

#token_value ⇒ `Object`



75
76
77

# File 'lib/ecu/interfaces/dcm/dcm_lexer.rb', line 75

# Returns the text of the scanner's most recent match, as reported by
# StringScanner#matched.
def token_value
  @scan.matched
end

Class: Ecu::LabelList::DcmLexer

Constant Summary collapse

Instance Attribute Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize(doc) ⇒ DcmLexer

Instance Attribute Details

#doc ⇒ Object (readonly)

Instance Method Details

#lineno ⇒ Object

#next_token ⇒ Object