
After go1.16, go will use module mode by default, even when the repository is checked out under GOPATH or in a one-off directory. Add go.mod, go.sum to keep this repo buildable without opting out of the module mode. > go mod init github.com/mmcgrana/gobyexample > go mod tidy > go mod vendor In module mode, the 'vendor' directory is special and its contents will be actively maintained by the go command. pygments aren't the dependency the go will know about, so it will delete the contents from vendor directory. Move it to `third_party` directory now. And, vendor the blackfriday package. Note: the tutorial contents are not affected by the change in go1.16 because all the examples in this tutorial ask users to run the go command with the explicit list of files to be compiled (e.g. `go run hello-world.go` or `go build command-line-arguments.go`). When the source list is provided, the go command does not have to compute the build list and whether it's running in GOPATH mode or module mode becomes irrelevant.
281 lines
4.2 KiB
Plaintext
281 lines
4.2 KiB
Plaintext
/*
|
|
* Lexes Ragel input files.
|
|
*
|
|
* @LANG: c++
|
|
*
|
|
* Test works with split code gen.
|
|
*/
|
|
|
|
#include <iostream>
|
|
#include <stdlib.h>
|
|
#include <stdio.h>
|
|
#include <string.h>
|
|
|
|
using namespace std;
|
|
|
|
void escapeXML( const char *data )
|
|
{
|
|
while ( *data != 0 ) {
|
|
switch ( *data ) {
|
|
case '<': cout << "<"; break;
|
|
case '>': cout << ">"; break;
|
|
case '&': cout << "&"; break;
|
|
default: cout << *data; break;
|
|
}
|
|
data += 1;
|
|
}
|
|
}
|
|
|
|
void escapeXML( char c )
|
|
{
|
|
switch ( c ) {
|
|
case '<': cout << "<"; break;
|
|
case '>': cout << ">"; break;
|
|
case '&': cout << "&"; break;
|
|
default: cout << c; break;
|
|
}
|
|
}
|
|
|
|
void escapeXML( const char *data, int len )
|
|
{
|
|
for ( const char *end = data + len; data != end; data++ ) {
|
|
switch ( *data ) {
|
|
case '<': cout << "<"; break;
|
|
case '>': cout << ">"; break;
|
|
case '&': cout << "&"; break;
|
|
default: cout << *data; break;
|
|
}
|
|
}
|
|
}
|
|
|
|
inline void write( const char *data )
|
|
{
|
|
cout << data;
|
|
}
|
|
|
|
inline void write( char c )
|
|
{
|
|
cout << c;
|
|
}
|
|
|
|
inline void write( const char *data, int len )
|
|
{
|
|
cout.write( data, len );
|
|
}
|
|
|
|
|
|
%%{
|
|
machine RagelScan;
|
|
|
|
word = [a-zA-Z_][a-zA-Z_0-9]*;
|
|
integer = [0-9]+;
|
|
hex = '0x' [0-9a-fA-F] [0-9a-fA-F]*;
|
|
|
|
default = ^0;
|
|
EOF = 0;
|
|
|
|
# Handles comments in outside code and inline blocks.
|
|
c_comment :=
|
|
( default* :>> '*/' )
|
|
${ escapeXML( fc ); }
|
|
@{ fret; };
|
|
|
|
action emit {
|
|
escapeXML( ts, te-ts );
|
|
}
|
|
|
|
#
|
|
# Inline action code
|
|
#
|
|
|
|
ilscan := |*
|
|
|
|
"'" ( [^'\\] | /\\./ )* "'" => emit;
|
|
'"' ( [^"\\] | /\\./ )* '"' => emit;
|
|
'/*' {
|
|
write( "/*" );
|
|
fcall c_comment;
|
|
};
|
|
'//' [^\n]* '\n' => emit;
|
|
|
|
'{' {
|
|
write( '{' );
|
|
inline_depth += 1;
|
|
};
|
|
|
|
'}' {
|
|
write( '}' );
|
|
/* If dropping down to the last } then return
|
|
* to ragel code. */
|
|
if ( --inline_depth == 0 ) {
|
|
write( "</inline>\n" );
|
|
fgoto rlscan;
|
|
}
|
|
};
|
|
|
|
default => { escapeXML( *ts ); };
|
|
*|;
|
|
|
|
#
|
|
# Ragel Tokens
|
|
#
|
|
|
|
rlscan := |*
|
|
'}%%' {
|
|
if ( !single_line ) {
|
|
write( "</section>\n" );
|
|
fgoto main;
|
|
}
|
|
};
|
|
|
|
'\n' {
|
|
if ( single_line ) {
|
|
write( "</section>\n" );
|
|
fgoto main;
|
|
}
|
|
};
|
|
|
|
# Word
|
|
word {
|
|
write( "<word>" );
|
|
write( ts, te-ts );
|
|
write( "</word>\n" );
|
|
};
|
|
|
|
# Decimal integer.
|
|
integer {
|
|
write( "<int>" );
|
|
write( ts, te-ts );
|
|
write( "</int>\n" );
|
|
};
|
|
|
|
# Hexidecimal integer.
|
|
hex {
|
|
write( "<hex>" );
|
|
write( ts, te-ts );
|
|
write( "</hex>\n" );
|
|
};
|
|
|
|
# Consume comments.
|
|
'#' [^\n]* '\n';
|
|
|
|
# Single literal string.
|
|
"'" ( [^'\\] | /\\./ )* "'" {
|
|
write( "<single_lit>" );
|
|
escapeXML( ts, te-ts );
|
|
write( "</single_lit>\n" );
|
|
};
|
|
|
|
# Double literal string.
|
|
'"' ( [^"\\] | /\\./ )* '"' {
|
|
write( "<double_lit>" );
|
|
escapeXML( ts, te-ts );
|
|
write( "</double_lit>\n" );
|
|
};
|
|
|
|
# Or literal.
|
|
'[' ( [^\]\\] | /\\./ )* ']' {
|
|
write( "<or_lit>" );
|
|
escapeXML( ts, te-ts );
|
|
write( "</or_lit>\n" );
|
|
};
|
|
|
|
# Regex Literal.
|
|
'/' ( [^/\\] | /\\./ ) * '/' {
|
|
write( "<re_lit>" );
|
|
escapeXML( ts, te-ts );
|
|
write( "</re_lit>\n" );
|
|
};
|
|
|
|
# Open an inline block
|
|
'{' {
|
|
inline_depth = 1;
|
|
write( "<inline>{" );
|
|
fgoto ilscan;
|
|
};
|
|
|
|
punct {
|
|
write( "<symbol>" );
|
|
escapeXML( fc );
|
|
write( "</symbol>\n" );
|
|
};
|
|
|
|
default;
|
|
*|;
|
|
|
|
#
|
|
# Outside code.
|
|
#
|
|
|
|
main := |*
|
|
|
|
"'" ( [^'\\] | /\\./ )* "'" => emit;
|
|
'"' ( [^"\\] | /\\./ )* '"' => emit;
|
|
|
|
'/*' {
|
|
escapeXML( ts, te-ts );
|
|
fcall c_comment;
|
|
};
|
|
|
|
'//' [^\n]* '\n' => emit;
|
|
|
|
'%%{' {
|
|
write( "<section>\n" );
|
|
single_line = false;
|
|
fgoto rlscan;
|
|
};
|
|
|
|
'%%' {
|
|
write( "<section>\n" );
|
|
single_line = true;
|
|
fgoto rlscan;
|
|
};
|
|
|
|
default {
|
|
escapeXML( *ts );
|
|
};
|
|
|
|
# EOF.
|
|
EOF;
|
|
*|;
|
|
}%%
|
|
|
|
%% write data nofinal;
|
|
|
|
void test( const char *data )
|
|
{
|
|
std::ios::sync_with_stdio(false);
|
|
|
|
int cs, act;
|
|
const char *ts, *te;
|
|
int stack[1], top;
|
|
|
|
bool single_line = false;
|
|
int inline_depth = 0;
|
|
|
|
%% write init;
|
|
|
|
/* Read in a block. */
|
|
const char *p = data;
|
|
const char *pe = data + strlen( data );
|
|
const char *eof = pe;
|
|
%% write exec;
|
|
|
|
if ( cs == RagelScan_error ) {
|
|
/* Machine failed before finding a token. */
|
|
cerr << "PARSE ERROR" << endl;
|
|
exit(1);
|
|
}
|
|
}
|
|
|
|
#define BUFSIZE 2048
|
|
|
|
int main()
|
|
{
|
|
std::ios::sync_with_stdio(false);
|
|
|
|
test("hi %%{ /'}%%'/ { /*{*/ {} } + '\\'' }%%there\n");
|
|
|
|
return 0;
|
|
}
|