markdown_25.0.0_0acbc1c0/source/parser/implementation/markdown-implementation-paragraphs-tables.adb

  1
  2
  3
  4
  5
  6
  7
  8
  9
 10
 11
 12
 13
 14
 15
 16
 17
 18
 19
 20
 21
 22
 23
 24
 25
 26
 27
 28
 29
 30
 31
 32
 33
 34
 35
 36
 37
 38
 39
 40
 41
 42
 43
 44
 45
 46
 47
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
--
--  Copyright (C) 2021-2024, AdaCore
--
--  SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
--

with VSS.Regular_Expressions;

package body Markdown.Implementation.Paragraphs.Tables is

   Cell_Pattern : constant Wide_Wide_String :=
     " *((?: *(?:[^ |\\]|\\.))*) *(\|)?";
   --  Pattern for a single table cell; Split_Table_Row applies it
   --  repeatedly along a row.
   --  Group 1 - cell text with spaces stripped
   --  Group 2 - pipe separator if any
   --  Inside group 1 a backslash followed by any character is consumed as a
   --  unit, so an escaped pipe (\|) stays in the cell text instead of
   --  terminating the cell.

   Cell : VSS.Regular_Expressions.Regular_Expression;
   --  Regexp of Cell_Pattern. It is constructed on the first call of
   --  Detector, so it is not valid before that.

   Delimiter_Pattern : constant Wide_Wide_String := ":?-+:?";
   --  The delimiter row consists of cells whose only content are hyphens (-),
   --  and optionally, a leading or trailing colon (:), or both

   Delimiter : VSS.Regular_Expressions.Regular_Expression;
   --  Regexp of Delimiter_Pattern. Constructed together with Cell on the
   --  first call of Detector.

   Anchored : constant VSS.Regular_Expressions.Match_Options :=
     [VSS.Regular_Expressions.Anchored_Match => True];
   --  Match options with Anchored_Match enabled. Used by Is_Delimiter when
   --  a cell is checked against Delimiter.
   --  NOTE(review): exact anchoring semantics (start only, or both ends) are
   --  defined by VSS - confirm against VSS.Regular_Expressions.

   procedure Split_Table_Row
     (Text  : VSS.Strings.Virtual_String;
      First : VSS.Strings.Character_Iterators.Character_Iterator;
      Cells : out VSS.String_Vectors.Virtual_String_Vector;
      Weak  : Boolean);
   --  Split Text into table cells vector according to GFM rules.
   --  Scanning starts at the position given by First and the cell texts
   --  found are returned in Cells. An empty first cell (a row that starts
   --  with a pipe) is not included in the result.
   --  If Weak = True then accept a first cell even when it doesn't end with
   --  a pipe (|).

   function Is_Delimiter (Cell : VSS.Strings.Virtual_String) return Boolean is
      --  Check whether the text of a single cell matches Delimiter_Pattern.
      --  Note: the Cell parameter hides the package-level Cell regexp here.

      Found : constant VSS.Regular_Expressions.Regular_Expression_Match :=
        Delimiter.Match (Cell, Anchored);
   begin
      return Found.Has_Match;
   end Is_Delimiter;

   function Is_Delimiter_Row
     (Cells : VSS.String_Vectors.Virtual_String_Vector) return Boolean is
      --  Return True when every cell in Cells is a delimiter cell.
      --  An empty vector yields True, so callers have to check for
      --  emptiness themselves.
   begin
      for Item of Cells loop
         if not Is_Delimiter (Item) then
            return False;
         end if;
      end loop;

      return True;
   end Is_Delimiter_Row;

   -----------------
   -- Append_Line --
   -----------------

   overriding procedure Append_Line
     (Self  : in out Paragraph;
      Input : Input_Position;
      CIP   : Can_Interrupt_Paragraph;
      Ok    : in out Boolean)
   is
      --  Try to continue the paragraph/table with the line at Input.
      --  Ok is set to False (and nothing is stored) when the line has no
      --  element at Input.First or when CIP is set.

      Row : VSS.String_Vectors.Virtual_String_Vector;
      --  Cells of the current line
   begin
      Ok := Input.First.Has_Element and not CIP;

      if not Ok then
         return;
      end if;

      if Self.Column_Count > 0 then
         --  Already a table: the line is a body row. Store exactly
         --  Column_Count cells for it, dropping excess cells and padding
         --  missing ones with empty strings.

         Split_Table_Row
           (Text  => Input.Line.Expanded,
            First => Input.First,
            Cells => Row,
            Weak  => True);

         for J in 1 .. Self.Column_Count loop
            if J <= Row.Length then
               Self.Cells.Append (Row (J));
            else
               Self.Cells.Append (VSS.Strings.Empty_Virtual_String);
            end if;
         end loop;

      elsif Self.Lines.Length = 1 then
         --  Only the header candidate has been seen so far, so this line
         --  has to be the table delimiter row.

         Split_Table_Row
           (Text  => Input.Line.Expanded,
            First => Input.First,
            Cells => Row,
            Weak  => False);

         if not Row.Is_Empty
           and then Is_Delimiter_Row (Row)
           and then Row.Length = Self.Cells.Length
         then
            --  Header and delimiter rows agree in the number of cells:
            --  turn the paragraph into a table.
            Self.Column_Count := Row.Length;
            Self.Cells.Append (Row);
         else
            --  Not a table: forget the header cells and keep the line as
            --  ordinary paragraph text.
            Self.Cells.Clear;
            Self.Lines.Append (Input.Line.Unexpanded_Tail (Input.First));
         end if;

      else
         --  Ordinary paragraph continuation line
         Self.Lines.Append (Input.Line.Unexpanded_Tail (Input.First));
      end if;
   end Append_Line;

   ----------------------
   -- Complete_Parsing --
   ----------------------

   overriding procedure Complete_Parsing
     (Self   : in out Paragraph;
      Parser : Markdown.Inline_Parsers.Inline_Parser)
   is
   begin
      --  Only remember the inline parser; no text is parsed here.
      --  NOTE(review): Unchecked_Access means the stored reference is not
      --  checked for lifetime - presumably the parser outlives Self.
      Self.Parser := Parser'Unchecked_Access;
   end Complete_Parsing;

   ------------
   -- Create --
   ------------

   overriding function Create
     (Input : not null access Input_Position) return Paragraph is
   begin
      --  Build a paragraph from the line at Input and consume that line.

      return Block : Paragraph do
         --  The raw text of the line is kept in case this turns out to be
         --  an ordinary paragraph
         Block.Lines.Append (Input.Line.Unexpanded_Tail (Input.First));

         --  The same line is also split into cells: it becomes the table
         --  header if the next line is a delimiter row
         Split_Table_Row
           (Text  => Input.Line.Expanded,
            First => Input.First,
            Cells => Block.Cells,
            Weak  => False);

         --  The whole line is consumed: move Input.First to end-of-line
         Input.First.Set_After_Last (Input.Line.Expanded);
      end return;
   end Create;

   --------------
   -- Detector --
   --------------

   procedure Detector
     (Input : Input_Position;
      Tag   : in out Ada.Tags.Tag;
      CIP   : out Can_Interrupt_Paragraph)
   is
      --  Detect whether a paragraph/table can start at Input.
      --
      --  Tag is set to Paragraph'Tag when the line has an element at
      --  Input.First, and is left unchanged otherwise.
      --  CIP is always set to False: this block never interrupts a
      --  paragraph.
      --
      --  As a side effect, the first call constructs the Cell and Delimiter
      --  regular expressions used by the rest of this package.
   begin
      --  Assign the out parameter on every path. It used to be left
      --  unassigned when nothing was detected, so the value copied back to
      --  the caller was undefined.
      CIP := False;

      if not Cell.Is_Valid then  --  Construct regexps
         Cell := VSS.Regular_Expressions.To_Regular_Expression
           (VSS.Strings.To_Virtual_String (Cell_Pattern));
         Delimiter := VSS.Regular_Expressions.To_Regular_Expression
           (VSS.Strings.To_Virtual_String (Delimiter_Pattern));
      end if;

      if Input.First.Has_Element then  --  XXX: use Blank_Pattern here
         Tag := Paragraph'Tag;
      end if;
   end Detector;

   ---------------------
   -- Split_Table_Row --
   ---------------------

   procedure Split_Table_Row
     (Text  : VSS.Strings.Virtual_String;
      First : VSS.Strings.Character_Iterators.Character_Iterator;
      Cells : out VSS.String_Vectors.Virtual_String_Vector;
      Weak  : Boolean)
   is
      --  Split the table row in Text, starting at First, into cell texts.
      --
      --  Text  - the line to split
      --  First - position in Text where the row starts
      --  Cells - receives the cell texts (group 1 of Cell_Pattern), in order
      --  Weak  - when False, a first cell that isn't terminated by a pipe
      --          is dropped; when True, it is accepted
      --
      --  An empty first cell (row starting with a pipe) is never reported,
      --  and neither is whitespace remaining after the last pipe.
      --  The Cell regexp must already be constructed (see Detector).

      Next : VSS.Strings.Character_Iterators.Character_Iterator;
      --  Position where the match for the next cell starts

      Skip : Boolean := True;
      --  True only while the very first cell of the row is processed
   begin
      --  Don't rely on the caller passing an empty vector: the result of an
      --  out parameter must not depend on its previous content.
      Cells.Clear;

      Next.Set_At (First);

      loop
         declare
            Match : constant VSS.Regular_Expressions.Regular_Expression_Match
              := Cell.Match (Text, Next);
         begin
            --  Nothing was consumed: the end of the row has been reached
            exit when not Match.Has_Match or else Match.Captured.Is_Empty;

            if not Weak and Skip and not Match.Has_Capture (2) then
               null;  --  Ignore the very first cell if there is no pipe |
            elsif Skip and then Match.Captured (1).Is_Empty then
               null;  --  Ignore the very first empty cell
            elsif Match.Captured (1).Is_Empty
              and then not Match.Has_Capture (2)
            then
               --  Only whitespace is left after the last pipe. It isn't
               --  a cell; counting it would make the header and delimiter
               --  rows disagree in the number of cells.
               null;
            else
               Cells.Append (Match.Captured (1));
            end if;

            --  A cell without a closing pipe is the last one in the row
            exit when not Match.Has_Capture (2);

            --  Continue right after the matched text
            Next.Set_At (Match.Last_Marker);
            Forward (Next);
            Skip := False;
         end;
      end loop;
   end Split_Table_Row;

   ----------------------------
   -- Table_Column_Alignment --
   ----------------------------

   overriding function Table_Column_Alignment
     (Self : Paragraph; Column : Positive) return Natural
   is
      --  Return the alignment code of the given column, derived from the
      --  colons in its delimiter cell:
      --    0 - no colon
      --    1 - leading colon only
      --    2 - trailing colon only
      --    3 - both leading and trailing colons
      --  NOTE(review): presumably none/left/right/center as in GFM - confirm
      --  against the specification of this function.

      Marker : constant VSS.Strings.Virtual_String :=
        Self.Cells (Self.Column_Count + Column);
      --  Delimiter row cells are stored right after the header row cells

      Leading  : constant Boolean := Marker.Starts_With (":");
      Trailing : constant Boolean := Marker.Ends_With (":");
   begin
      return
        (if Leading and then Trailing then 3
         elsif Leading then 1
         elsif Trailing then 2
         else 0);
   end Table_Column_Alignment;

end Markdown.Implementation.Paragraphs.Tables;