" Abstract base class for regex-rule-driven syntax highlighting of single lines.
" process_line runs the pipeline parse_line -> order_matches -> extend_matches -> format_line.
" order_matches is abstract, so each concrete highlighter has to supply it.
CLASS zcl_abapgit_syntax_highlighter DEFINITION
PUBLIC
ABSTRACT
CREATE PUBLIC .
PUBLIC SECTION.
" Factory: chooses the concrete highlighter class from the file name
" (patterns *.abap, *.xml, *.html, *.css, *.js, *.json).
" Returns an initial reference for any other file name.
CLASS-METHODS create
IMPORTING
!iv_filename TYPE string
RETURNING
VALUE(ro_instance) TYPE REF TO zcl_abapgit_syntax_highlighter .
" Highlights one line of text.
" Empty or whitespace-only lines are returned unchanged.
METHODS process_line
IMPORTING
!iv_line TYPE string
RETURNING
VALUE(rv_line) TYPE string .
PROTECTED SECTION.
" One segment of a line, identified by offset/length and tagged with a rule token.
TYPES:
BEGIN OF ty_match,
token TYPE c LENGTH 1, " Type of matches
offset TYPE i, " Beginning position of the string that should be formatted
length TYPE i, " Length of the string that should be formatted
text_tag TYPE string, " Type of text tag
END OF ty_match .
TYPES:
ty_match_tt TYPE STANDARD TABLE OF ty_match WITH DEFAULT KEY .
" One highlighting rule: the regex to search for, the token stored on its matches,
" the style looked up by token in format_line, and the index of the submatch to use
" (0 = use the whole match).
TYPES:
BEGIN OF ty_rule,
regex TYPE REF TO cl_abap_regex,
token TYPE c LENGTH 1,
style TYPE string,
relevant_submatch TYPE i,
END OF ty_rule .
" Token given by extend_matches to segments that are not covered by any match.
CONSTANTS c_token_none TYPE c VALUE '.' ##NO_TEXT.
" Rule table filled by add_rule; read by parse_line and format_line.
DATA:
mt_rules TYPE STANDARD TABLE OF ty_rule .
" Appends a rule to mt_rules. The regex is compiled case-insensitively;
" an empty iv_regex produces a rule without a regex object.
" Presumably called by subclasses to register their rules - not called in this class.
METHODS add_rule
IMPORTING
!iv_regex TYPE string
!iv_token TYPE c
!iv_style TYPE string
!iv_submatch TYPE i OPTIONAL .
" Runs every rule that has a regex against the line and collects all matches.
METHODS parse_line
IMPORTING
!iv_line TYPE string
RETURNING
VALUE(rt_matches) TYPE ty_match_tt .
" Hook implemented by subclasses; called between parse_line and extend_matches.
" NOTE(review): presumably expected to sort the matches and resolve overlaps - confirm in subclasses.
METHODS order_matches
ABSTRACT
IMPORTING
!iv_line TYPE string
CHANGING
!ct_matches TYPE ty_match_tt .
" Sorts the matches by offset and adds c_token_none segments for the gaps between
" matches and for the remainder of the line.
METHODS extend_matches
IMPORTING
!iv_line TYPE string
CHANGING
!ct_matches TYPE ty_match_tt .
" Cuts the line into the given segments, applies the style of the rule with the
" same token to each segment, and concatenates the results.
METHODS format_line
IMPORTING
!iv_line TYPE string
!it_matches TYPE ty_match_tt
RETURNING
VALUE(rv_line) TYPE string .
" Escapes a text chunk (format e_html_attr); iv_class is the style to apply to it.
METHODS apply_style
IMPORTING
!iv_line TYPE string
!iv_class TYPE string
RETURNING
VALUE(rv_line) TYPE string .
" Returns abap_true when the string contains only blanks, tabs, CR and LF characters.
METHODS is_whitespace
IMPORTING
!iv_string TYPE string
RETURNING
VALUE(rv_result) TYPE abap_bool .
PRIVATE SECTION.
ENDCLASS.
CLASS ZCL_ABAPGIT_SYNTAX_HIGHLIGHTER IMPLEMENTATION.
METHOD add_rule.
  " Builds one highlighting rule from the parameters and appends it to MT_RULES.
  " The pattern is compiled case-insensitively. An empty pattern produces a
  " rule whose REGEX reference stays unbound.

  DATA ls_new_rule LIKE LINE OF mt_rules.

  ls_new_rule-token             = iv_token.
  ls_new_rule-style             = iv_style.
  ls_new_rule-relevant_submatch = iv_submatch.

  IF iv_regex IS NOT INITIAL.
    CREATE OBJECT ls_new_rule-regex
      EXPORTING
        pattern     = iv_regex
        ignore_case = abap_true.
  ENDIF.

  APPEND ls_new_rule TO mt_rules.

ENDMETHOD.
METHOD apply_style.
  " Escapes a text chunk for HTML output and, when a style class is supplied,
  " wraps the escaped text in a <span> element carrying that class.
  "
  " iv_line  - raw text chunk taken from the source line
  " iv_class - CSS class name; empty means "no styling"
  " rv_line  - escaped text, wrapped in <span class="..."> if iv_class is set
  "
  " Fix: both branches used to return the bare escaped text, so iv_class was
  " never used and no style was ever applied.

  DATA lv_escaped TYPE string.

  lv_escaped = escape( val    = iv_line
                       format = cl_abap_format=>e_html_attr ).

  IF iv_class IS INITIAL.
    rv_line = lv_escaped.
  ELSE.
    rv_line = |<span class="{ iv_class }">{ lv_escaped }</span>|.
  ENDIF.

ENDMETHOD.
METHOD create.
  " Factory: instantiates the highlighter that matches the file extension.
  " File names that match none of the patterns leave RO_INSTANCE initial.

  IF iv_filename CP '*.abap'.
    CREATE OBJECT ro_instance TYPE zcl_abapgit_syntax_abap.
    RETURN.
  ENDIF.

  " XML and HTML share one highlighter
  IF iv_filename CP '*.xml' OR iv_filename CP '*.html'.
    CREATE OBJECT ro_instance TYPE zcl_abapgit_syntax_xml.
    RETURN.
  ENDIF.

  IF iv_filename CP '*.css'.
    CREATE OBJECT ro_instance TYPE zcl_abapgit_syntax_css.
    RETURN.
  ENDIF.

  IF iv_filename CP '*.js'.
    CREATE OBJECT ro_instance TYPE zcl_abapgit_syntax_js.
    RETURN.
  ENDIF.

  IF iv_filename CP '*.json'.
    CREATE OBJECT ro_instance TYPE zcl_abapgit_syntax_json.
    RETURN.
  ENDIF.

  " Unsupported file type: hand back an initial reference
  CLEAR ro_instance.

ENDMETHOD.
METHOD extend_matches.
  " Completes the match table so that it describes the line from offset 0 to
  " its end: after sorting by offset, every stretch of text not covered by a
  " match gets an entry with token C_TOKEN_NONE (text that is not formatted).
  "
  " iv_line    - the line the matches refer to
  " ct_matches - matches; sorted by offset and extended with gap entries
  "
  " Fix: the field-symbol name was missing from the declaration, the ASSIGNING
  " addition and all component accesses, which is not valid ABAP.

  DATA: lv_line_len TYPE i,
        lv_last_pos TYPE i,
        ls_gap      TYPE ty_match.

  FIELD-SYMBOLS <ls_match> TYPE ty_match.

  lv_line_len  = strlen( iv_line ).
  ls_gap-token = c_token_none.

  SORT ct_matches BY offset.

  " Add entries referring to parts of text that should not be formatted
  LOOP AT ct_matches ASSIGNING <ls_match>.
    IF <ls_match>-offset > lv_last_pos.
      ls_gap-offset = lv_last_pos.
      ls_gap-length = <ls_match>-offset - lv_last_pos.
      " Insert in front of the current row so the table stays ordered by offset
      INSERT ls_gap INTO ct_matches INDEX sy-tabix.
    ENDIF.
    lv_last_pos = <ls_match>-offset + <ls_match>-length.
  ENDLOOP.

  " Add remainder of the string
  IF lv_line_len > lv_last_pos.
    ls_gap-offset = lv_last_pos.
    ls_gap-length = lv_line_len - lv_last_pos.
    APPEND ls_gap TO ct_matches.
  ENDIF.

ENDMETHOD.
METHOD format_line.
  " Builds the formatted line: cuts IV_LINE into the segments listed in
  " IT_MATCHES, passes each segment through APPLY_STYLE with the style of the
  " first rule carrying the segment's token, and concatenates the results.
  "
  " iv_line    - the original line
  " it_matches - segments (offset/length/token) in output order
  " rv_line    - concatenation of all processed segments
  "
  " Fix: the field-symbol name was missing from the declaration, the ASSIGNING
  " addition and all component accesses, which is not valid ABAP.

  DATA: lv_chunk TYPE string,
        ls_rule  LIKE LINE OF mt_rules.

  FIELD-SYMBOLS <ls_match> TYPE ty_match.

  LOOP AT it_matches ASSIGNING <ls_match>.
    lv_chunk = substring( val = iv_line
                          off = <ls_match>-offset
                          len = <ls_match>-length ).

    " READ TABLE leaves LS_RULE untouched on failure, so clear it first:
    " a failed read then means "no style"
    CLEAR ls_rule.
    READ TABLE mt_rules INTO ls_rule WITH KEY token = <ls_match>-token.

    lv_chunk = apply_style( iv_line  = lv_chunk
                            iv_class = ls_rule-style ).

    rv_line = rv_line && lv_chunk.
  ENDLOOP.

ENDMETHOD.
METHOD is_whitespace.
  " Tells whether IV_STRING consists solely of blanks, horizontal tabs,
  " carriage returns and line feeds.

  DATA lv_blank_chars TYPE string.

  lv_blank_chars = ` `
                && cl_abap_char_utilities=>horizontal_tab
                && cl_abap_char_utilities=>cr_lf.

  " CO = "contains only" characters from the given set
  rv_result = boolc( iv_string CO lv_blank_chars ).

ENDMETHOD.
METHOD parse_line.
  " Runs every rule that has a regex against IV_LINE and returns all hits as
  " match entries tagged with the rule's token.
  "
  " For a rule with RELEVANT_SUBMATCH = 0 the whole match is recorded;
  " otherwise only the submatch with that index is recorded, and only if it
  " exists and is not empty.
  "
  " iv_line    - the line to scan
  " rt_matches - all matches of all rules, in rule order (may overlap)
  "
  " Fix: the three field-symbol names were missing from the declarations, the
  " ASSIGNING additions and all component accesses, which is not valid ABAP.
  " The redundant local regex reference was dropped as well.

  DATA: lo_matcher TYPE REF TO cl_abap_matcher,
        lt_result  TYPE match_result_tab,
        ls_match   TYPE ty_match.

  FIELD-SYMBOLS: <ls_regex>    LIKE LINE OF mt_rules,
                 <ls_result>   TYPE match_result,
                 <ls_submatch> LIKE LINE OF <ls_result>-submatches.

  " Process syntax-dependent regex table and find all matches
  LOOP AT mt_rules ASSIGNING <ls_regex> WHERE regex IS BOUND.
    lo_matcher = <ls_regex>-regex->create_matcher( text = iv_line ).
    lt_result  = lo_matcher->find_all( ).

    " Save matches into custom table with predefined tokens
    LOOP AT lt_result ASSIGNING <ls_result>.
      CLEAR ls_match.

      IF <ls_regex>-relevant_submatch = 0.
        ls_match-offset = <ls_result>-offset.
        ls_match-length = <ls_result>-length.
      ELSE.
        READ TABLE <ls_result>-submatches ASSIGNING <ls_submatch>
          INDEX <ls_regex>-relevant_submatch.
        " Submatch might be empty if only discarded parts matched
        IF sy-subrc <> 0 OR <ls_submatch>-offset < 0 OR <ls_submatch>-length <= 0.
          CONTINUE.
        ENDIF.
        ls_match-offset = <ls_submatch>-offset.
        ls_match-length = <ls_submatch>-length.
      ENDIF.

      ls_match-token = <ls_regex>-token.
      APPEND ls_match TO rt_matches.
    ENDLOOP.
  ENDLOOP.

ENDMETHOD.
METHOD process_line.
  " Highlights a single line. Empty and whitespace-only lines are handed back
  " untouched; every other line goes through parse -> order -> extend -> format.

  DATA lt_segments TYPE ty_match_tt.

  IF iv_line IS NOT INITIAL AND is_whitespace( iv_line ) <> abap_true.

    lt_segments = parse_line( iv_line ).

    order_matches(
      EXPORTING
        iv_line    = iv_line
      CHANGING
        ct_matches = lt_segments ).

    extend_matches(
      EXPORTING
        iv_line    = iv_line
      CHANGING
        ct_matches = lt_segments ).

    rv_line = format_line( iv_line    = iv_line
                           it_matches = lt_segments ).

  ELSE.
    " Nothing to highlight
    rv_line = iv_line.
  ENDIF.

ENDMETHOD.
ENDCLASS.