summaryrefslogtreecommitdiff
path: root/urlscanner.l
blob: 5f9acb6b93489a188a47e764499dfd3ae0c65d18 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
%option noyywrap
%option yylineno
%option nounput
%option nodefault

%{
/* NOTE(review): yystype and the token codes used by the rules below
   (TOKEN_URL, TOKEN_TEXT, MYEOF) are presumably declared in this header --
   confirm. */
#include "urlscanner.h"
/* Needed for strdup(), which the rules use to copy matched text. */
#include "string.h"
/* Semantic value of the token most recently returned by yylex(); the rules
   store the matched URL or link text here before returning. */
yystype yylval;
%}

/* Exclusive start conditions tracking progress through one anchor tag:
     ATAG_HREF    - just past  href="  , reading the quoted URL value;
     ATAG_BETWEEN - URL already returned, skipping to the tag's closing '>';
     ATAG_DESC    - past the '>', reading the link text up to the next '<'. */
%x ATAG_HREF
%x ATAG_BETWEEN
%x ATAG_DESC

%%

[^<]* { /* Outside an anchor: discard everything up to the next '<'. */ }

  /* Anchor opener: consumes "<a", any attributes preceding href, and the
     opening double quote of the href value, then switches to ATAG_HREF so
     the next token is the URL itself.
     NOTE(review): the match is case-sensitive, only recognises double-quoted
     values, and "<a"[^>]* also accepts longer tag names beginning with 'a'
     as well as attributes whose name merely ends in "href" -- confirm that
     this looseness is intended. */
"<a"[^>]*"href=\"" { BEGIN(ATAG_HREF); }

<ATAG_HREF>[^\"]+ {
  /* Non-empty href value: everything up to (not including) the closing
     quote. The caller receives a heap copy made with strdup(). */
  yylval = strdup(yytext);
  BEGIN(ATAG_BETWEEN);
  return TOKEN_URL;
}

<ATAG_HREF>\" {
  /* Empty href (href=""): the closing quote directly follows the opening
     one. Return a heap-allocated empty string rather than a string literal
     so that every TOKEN_URL value has the same ownership as the strdup()
     result above and may safely be passed to free() by the consumer. */
  yylval = strdup("");
  BEGIN(ATAG_BETWEEN);
  return TOKEN_URL;
}

<ATAG_BETWEEN>[^>]* { /* Discard the remainder of the opening tag (closing quote, further attributes). */ }

  /* End of the opening tag: what follows is treated as the link text. */
<ATAG_BETWEEN>">" { BEGIN(ATAG_DESC); }

<ATAG_DESC>[^<]* {
  /* Link text: the run of characters up to (not including) the next '<'.
     Anchor handling is finished here, so fall back to the default state and
     hand the caller a strdup() copy of the matched text. */
  BEGIN(INITIAL);
  yylval = strdup(yytext);
  return TOKEN_TEXT;
}

. { /* Skip a single character the rules above did not consume (in practice a '<' that does not start an anchor with an href). */ }

  /* An unqualified <<EOF>> rule applies in every start condition, including
     the exclusive ATAG_* ones. Return to INITIAL before reporting end of
     input so that a document truncated in the middle of an anchor does not
     leave the scanner stuck in an ATAG_* state when it is given new input. */
<<EOF>>                            { BEGIN(INITIAL); return MYEOF; }

%%

/*
 * Make the NUL-terminated string `str` the scanner's input.
 *
 * yy_scan_string() works on its own copy of the string, so `str` need not
 * outlive this call. A NULL `str` is treated as empty input. Any buffer that
 * was current before the call is released, and the scanner is put back into
 * the INITIAL start condition so leftovers from a previous, partially scanned
 * input cannot affect the new one.
 */
void scan_string(const char* str) {
    /* yy_scan_string() allocates a new buffer on every call; delete the one
       being replaced so repeated calls do not leak. */
    if (YY_CURRENT_BUFFER) {
        yy_delete_buffer(YY_CURRENT_BUFFER);
    }

    /* yy_scan_string() already switches to the buffer it creates, so no
       separate yy_switch_to_buffer() call is required. */
    yy_scan_string(str ? str : "");

    BEGIN(INITIAL);
}