1/**
2
3	MultiMarkdown -- Lightweight markup processor to produce HTML, LaTeX, and more.
4
5	@file opml-lexer.c
6
7	@brief Tokenize OPML file for parsing
8
9
10	@author	Fletcher T. Penney
11	@bug
12
13**/
14
15/*
16
17	Copyright © 2016 - 2019 Fletcher T. Penney.
18
19
20	The `MultiMarkdown 6` project is released under the MIT License..
21
22	GLibFacade.c and GLibFacade.h are from the MultiMarkdown v4 project:
23
24		https://github.com/fletcher/MultiMarkdown-4/
25
26	MMD 4 is released under both the MIT License and GPL.
27
28
29	CuTest is released under the zlib/libpng license. See CuTest.c for the
30	text of the license.
31
32	uthash library:
33		Copyright (c) 2005-2016, Troy D. Hanson
34
35		Licensed under Revised BSD license
36
37	miniz library:
38		Copyright 2013-2014 RAD Game Tools and Valve Software
39		Copyright 2010-2014 Rich Geldreich and Tenacious Software LLC
40
41		Licensed under the MIT license
42
43	argtable3 library:
44		Copyright (C) 1998-2001,2003-2011,2013 Stewart Heitmann
45		<sheitmann@users.sourceforge.net>
46		All rights reserved.
47
48		Licensed under the Revised BSD License
49
50
51	## The MIT License ##
52
53	Permission is hereby granted, free of charge, to any person obtaining
54	a copy of this software and associated documentation files (the
55	"Software"), to deal in the Software without restriction, including
56	without limitation the rights to use, copy, modify, merge, publish,
57	distribute, sublicense, and/or sell copies of the Software, and to
58	permit persons to whom the Software is furnished to do so, subject to
59	the following conditions:
60
61	The above copyright notice and this permission notice shall be
62	included in all copies or substantial portions of the Software.
63
64	THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
65	EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
66	MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
67	IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
68	CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
69	TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
70	SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
71
72
73	## Revised BSD License ##
74
75	Redistribution and use in source and binary forms, with or without
76	modification, are permitted provided that the following conditions are
77	met:
78	    * Redistributions of source code must retain the above copyright
79	      notice, this list of conditions and the following disclaimer.
80	    * Redistributions in binary form must reproduce the above
81	      copyright notice, this list of conditions and the following
82	      disclaimer in the documentation and/or other materials provided
83	      with the distribution.
84	    * Neither the name of the <organization> nor the
85	      names of its contributors may be used to endorse or promote
86	      products derived from this software without specific prior
87	      written permission.
88
89	THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
90	"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
91	LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
92	A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL <COPYRIGHT
93	HOLDER> BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
94	EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
95	PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES LOSS OF USE, DATA, OR
96	PROFITS OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
97	LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
98	NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
99	SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
100
101
102*/
103
104#include <stdlib.h>
105
106#include "opml-lexer.h"
107#include "opml-parser.h"
108
109
110// Basic scanner struct
111
112#define YYCTYPE		unsigned char
113#define YYCURSOR	s->cur
114#define YYMARKER	s->ptr
115#define YYCTXMARKER	s->ctx
116
117int opml_scan(Scanner * s, const char * stop) {
118
119	scan:
120
121	if (s->cur >= stop) {
122		return 0;
123	}
124
125	s->start = s->cur;
126
127	/*!re2c
128		re2c:yyfill:enable = 0;
129
130		NL														= "\r\n" | '\n' | '\r';
131		WS														= [ \t]+;
132		WSNL													= (NL | WS)+;
133
134		EQUAL													= '=';
135
136		double_quoted											= '"' [^"\x00]* '"';
137
138		text_attribute											= WSNL* 'text' WSNL* EQUAL WSNL*;
139		note_attribute											= WSNL* '_note' WSNL* EQUAL WSNL*;
140
141		contains_newline										= "&#10;" | "&#13;";
142
143		'<?xml' [^>\x00]* '>'									{ return OPML_XML; }
144
145		'<opml' [^>\x00]* '>'									{ return OPML_OPML_OPEN; }
146		'</opml>'												{ return OPML_OPML_CLOSE; }
147
148		'<head' [^>\x00]* '>'									{ return OPML_HEAD_OPEN; }
149		'</head>'												{ return OPML_HEAD_CLOSE; }
150
151		'<title' [^>\x00]* '>'									{ return OPML_TITLE_OPEN; }
152		'</title>'												{ return OPML_TITLE_CLOSE; }
153
154		'<body' [^>\x00]* '>'									{ return OPML_BODY_OPEN; }
155		'</body>'												{ return OPML_BODY_CLOSE; }
156
157		'<outline' text_attribute '"&gt;&gt;Preamble&lt;&lt;"' note_attribute double_quoted WSNL* '>'		{ return OPML_OUTLINE_PREAMBLE; }
158		'<outline' text_attribute '"&gt;&gt;Metadata&lt;&lt;"' WSNL* '>'	{ return OPML_OUTLINE_METADATA; }
159
160
161		'<outline' [^>\x00]* '/>'								{ return OPML_OUTLINE_SELF_CLOSE; }
162		'<outline' [^>\x00]* '>'								{ return OPML_OUTLINE_OPEN; }
163		'</outline>'											{ return OPML_OUTLINE_CLOSE; }
164
165		WSNL													{ return OPML_WSNL; }
166
167		// Skip over anything else - '.' does not include '\n'
168		*														{ goto scan; }
169	*/
170}
171