xref: /OpenGrok/opengrok-indexer/src/main/jflex/analysis/plain/PlainXref.lex (revision d219b4cea555a12b602d2d5518daa22134ad4879)
1*d219b4ceSAdam Hornacek /*
2*d219b4ceSAdam Hornacek  * CDDL HEADER START
3*d219b4ceSAdam Hornacek  *
4*d219b4ceSAdam Hornacek  * The contents of this file are subject to the terms of the
5*d219b4ceSAdam Hornacek  * Common Development and Distribution License (the "License").
6*d219b4ceSAdam Hornacek  * You may not use this file except in compliance with the License.
7*d219b4ceSAdam Hornacek  *
8*d219b4ceSAdam Hornacek  * See LICENSE.txt included in this distribution for the specific
9*d219b4ceSAdam Hornacek  * language governing permissions and limitations under the License.
10*d219b4ceSAdam Hornacek  *
11*d219b4ceSAdam Hornacek  * When distributing Covered Code, include this CDDL HEADER in each
12*d219b4ceSAdam Hornacek  * file and include the License file at LICENSE.txt.
13*d219b4ceSAdam Hornacek  * If applicable, add the following below this CDDL HEADER, with the
14*d219b4ceSAdam Hornacek  * fields enclosed by brackets "[]" replaced with your own identifying
15*d219b4ceSAdam Hornacek  * information: Portions Copyright [yyyy] [name of copyright owner]
16*d219b4ceSAdam Hornacek  *
17*d219b4ceSAdam Hornacek  * CDDL HEADER END
18*d219b4ceSAdam Hornacek  */
19*d219b4ceSAdam Hornacek 
20*d219b4ceSAdam Hornacek /*
21*d219b4ceSAdam Hornacek  * Copyright (c) 2005, 2021, Oracle and/or its affiliates. All rights reserved.
22*d219b4ceSAdam Hornacek  * Portions Copyright (c) 2017, Chris Fraire <cfraire@me.com>.
23*d219b4ceSAdam Hornacek  */
24*d219b4ceSAdam Hornacek 
25*d219b4ceSAdam Hornacek package org.opengrok.indexer.analysis.plain;
26*d219b4ceSAdam Hornacek 
27*d219b4ceSAdam Hornacek import org.opengrok.indexer.analysis.JFlexSymbolMatcher;
28*d219b4ceSAdam Hornacek %%
29*d219b4ceSAdam Hornacek %public
30*d219b4ceSAdam Hornacek %class PlainXref
31*d219b4ceSAdam Hornacek %extends JFlexSymbolMatcher
32*d219b4ceSAdam Hornacek %unicode
33*d219b4ceSAdam Hornacek %ignorecase
34*d219b4ceSAdam Hornacek %int
35*d219b4ceSAdam Hornacek %char
36*d219b4ceSAdam Hornacek %include ../CommonLexer.lexh
37*d219b4ceSAdam Hornacek %include ../CommonXref.lexh
38*d219b4ceSAdam Hornacek 
39*d219b4ceSAdam Hornacek File = {FNameChar}+ "." ([a-zA-Z]+) {FNameChar}*
40*d219b4ceSAdam Hornacek 
41*d219b4ceSAdam Hornacek %include ../Common.lexh
42*d219b4ceSAdam Hornacek %include ../CommonURI.lexh
43*d219b4ceSAdam Hornacek %include ../CommonPath.lexh
44*d219b4ceSAdam Hornacek %include ../CommonLaxFPath.lexh
45*d219b4ceSAdam Hornacek %%
46*d219b4ceSAdam Hornacek {File} | {RelaxedMiddleFPath}
47*d219b4ceSAdam Hornacek         {
48*d219b4ceSAdam Hornacek         phLOC();
49*d219b4ceSAdam Hornacek         String s=yytext();
50*d219b4ceSAdam Hornacek         onFilelikeMatched(s, yychar);
51*d219b4ceSAdam Hornacek  }
52*d219b4ceSAdam Hornacek 
53*d219b4ceSAdam Hornacek {BrowseableURI}    {
54*d219b4ceSAdam Hornacek           phLOC();
55*d219b4ceSAdam Hornacek           onUriMatched(yytext(), yychar);
56*d219b4ceSAdam Hornacek         }
57*d219b4ceSAdam Hornacek 
58*d219b4ceSAdam Hornacek {FNameChar}+ "@" {FNameChar}+ "." {FNameChar}+
59*d219b4ceSAdam Hornacek         {
60*d219b4ceSAdam Hornacek           phLOC();
61*d219b4ceSAdam Hornacek           onEmailAddressMatched(yytext(), yychar);
62*d219b4ceSAdam Hornacek         }
63*d219b4ceSAdam Hornacek 
64*d219b4ceSAdam Hornacek // Bug #13362: If there's a very long sequence that matches {FNameChar}+,
65*d219b4ceSAdam Hornacek // parsing the file will take forever because of all the backtracking. With
66*d219b4ceSAdam Hornacek // this rule, we avoid much of the backtracking and speed up the parsing
67*d219b4ceSAdam Hornacek // (in some cases from hours to seconds!). This rule will not interfere with
68*d219b4ceSAdam Hornacek // the rules above because JFlex always picks the longest match.
69*d219b4ceSAdam Hornacek {FNameChar}+    { phLOC(); onNonSymbolMatched(yytext(), yychar); }
70*d219b4ceSAdam Hornacek 
71*d219b4ceSAdam Hornacek {WhspChar}*{EOL}    { onEndOfLineMatched(yytext(), yychar); }
72*d219b4ceSAdam Hornacek [[\s]--[\n]]    { onNonSymbolMatched(yytext(), yychar); }
73*d219b4ceSAdam Hornacek [^\n]    { phLOC(); onNonSymbolMatched(yytext(), yychar); }
74