parser: cached tokens (second step)

pull/2126/head
Alexander Medvednikov 2019-09-26 05:28:43 +03:00
parent a45255337d
commit da43267e09
8 changed files with 149 additions and 104 deletions

View File

@ -7,6 +7,7 @@ module main
import ( import (
vweb.tmpl // for `$vweb_html()` vweb.tmpl // for `$vweb_html()`
os os
strings
) )
fn (p mut Parser) comp_time() { fn (p mut Parser) comp_time() {
@ -244,21 +245,47 @@ fn (p mut Parser) gen_array_str(typ Type) {
!p.table.type_has_method(elm_type2, 'str') { !p.table.type_has_method(elm_type2, 'str') {
p.error('cant print ${elm_type}[], unhandled print of ${elm_type}') p.error('cant print ${elm_type}[], unhandled print of ${elm_type}')
} }
p.cgen.fns << ' p.v.vgen_file.writeln('
string ${typ.name}_str($typ.name a) { fn (a $typ.name) str() string {
strings__Builder sb = strings__new_builder(a.len * 3); mut sb := strings.new_builder(a.len * 3)
strings__Builder_write(&sb, tos2("[")) ; sb.write("[")
for (int i = 0; i < a.len; i++) { for i, elm in a {
strings__Builder_write(&sb, ${elm_type}_str( (($elm_type *) a.data)[i])); sb.write(elm.str())
if i < a.len - 1 {
if (i < a.len - 1) { sb.write(", ")
strings__Builder_write(&sb, tos2(", ")) ; }
} }
sb.write("]")
return sb.str()
} }
strings__Builder_write(&sb, tos2("]")) ; ')
return strings__Builder_str(sb); p.cgen.fns << 'string ${typ.name}_str();'
} ' }
// `Foo { bar: 3, baz: 'hi' }` => '{ bar: 3, baz: "hi" }'
fn (p mut Parser) gen_struct_str(typ Type) {
p.add_method(typ.name, Fn{
name: 'str'
typ: 'string'
args: [Var{typ: typ.name, is_arg:true}]
is_method: true
is_public: true
receiver_typ: typ.name
})
mut sb := strings.new_builder(typ.fields.len * 20)
sb.writeln('fn (a $typ.name) str() string {\nreturn')
sb.writeln("'{")
for field in typ.fields {
sb.writeln('\t$field.name: \$a.${field.name}')
}
sb.writeln("\n}'")
sb.writeln('}')
p.v.vgen_file.writeln(sb.str())
// Need to manually add the definition to `fns` so that it stays
// at the top of the file.
// This function will get parsee by V after the main pass.
p.cgen.fns << 'string ${typ.name}_str();'
} }

View File

@ -127,8 +127,12 @@ fn (p mut Parser) register_var(v Var) {
fn (p mut Parser) clear_vars() { fn (p mut Parser) clear_vars() {
// shared a := [1, 2, 3] // shared a := [1, 2, 3]
p.var_idx = 0 p.var_idx = 0
p.local_vars.free() if p.local_vars.len > 0 {
p.local_vars = []Var if p.pref.autofree {
p.local_vars.free()
}
p.local_vars = []Var
}
} }
// vlib header file? // vlib header file?
@ -173,7 +177,8 @@ fn (p mut Parser) fn_decl() {
p.error('invalid receiver type `$receiver_typ` (`$receiver_typ` is an interface)') p.error('invalid receiver type `$receiver_typ` (`$receiver_typ` is an interface)')
} }
// Don't allow modifying types from a different module // Don't allow modifying types from a different module
if !p.first_pass() && !p.builtin_mod && T.mod != p.mod { if !p.first_pass() && !p.builtin_mod && T.mod != p.mod &&
!p.fileis(vgen_file_name) { // allow .str() on builtin arrays
println('T.mod=$T.mod') println('T.mod=$T.mod')
println('p.mod=$p.mod') println('p.mod=$p.mod')
p.error('cannot define new methods on non-local type `$receiver_typ`') p.error('cannot define new methods on non-local type `$receiver_typ`')
@ -918,21 +923,13 @@ fn (p mut Parser) fn_call_args(f mut Fn) &Fn {
p.cgen.set_placeholder(ph, '${typ}_str(') p.cgen.set_placeholder(ph, '${typ}_str(')
p.gen(')') p.gen(')')
continue continue
} } else if T.cat == .struct_ {
p.gen_struct_str(T)
p.cgen.set_placeholder(ph, '${typ}_str(')
p.gen(')')
continue
}
error_msg := ('`$typ` needs to have method `str() string` to be printable') error_msg := ('`$typ` needs to have method `str() string` to be printable')
if T.fields.len > 0 {
mut index := p.cgen.cur_line.len - 1
for index > 0 && p.cgen.cur_line[index - 1] != `(` { index-- }
name := p.cgen.cur_line.right(index + 1)
if name == '}' {
p.error(error_msg)
}
p.cgen.resetln(p.cgen.cur_line.left(index))
p.scanner.create_type_string(T, name)
p.cgen.cur_line.replace(typ, '')
p.next()
return p.fn_call_args(mut f)
}
p.error(error_msg) p.error(error_msg)
} }
p.cgen.set_placeholder(ph, '${typ}_str(') p.cgen.set_placeholder(ph, '${typ}_str(')
@ -1029,7 +1026,6 @@ fn (p mut Parser) fn_call_args(f mut Fn) &Fn {
p.error('wrong number of arguments for fn `$f.name`: expected $f.args.len, but got more') p.error('wrong number of arguments for fn `$f.name`: expected $f.args.len, but got more')
} }
p.check(.rpar) p.check(.rpar)
// p.gen(')')
return f // TODO is return f right? return f // TODO is return f right?
} }

View File

@ -74,6 +74,7 @@ mut:
vroot string vroot string
mod string // module being built with -lib mod string // module being built with -lib
parsers []Parser parsers []Parser
vgen_file os.File
} }
struct Preferences { struct Preferences {
@ -153,6 +154,8 @@ fn main() {
vfmt(args) vfmt(args)
return return
} }
// Construct the V object from command line arguments // Construct the V object from command line arguments
mut v := new_v(args) mut v := new_v(args)
if args.join(' ').contains(' test v') { if args.join(' ').contains(' test v') {
@ -223,13 +226,9 @@ fn (v mut V) compile() {
if os.user_os() != 'windows' && v.os == .msvc { if os.user_os() != 'windows' && v.os == .msvc {
verror('Cannot build with msvc on ${os.user_os()}') verror('Cannot build with msvc on ${os.user_os()}')
} }
mut cgen := v.cgen mut cgen := v.cgen
cgen.genln('// Generated by V') cgen.genln('// Generated by V')
// Add builtin parsers
for i, file in v.files {
// v.parsers << v.new_parser(file)
}
if v.pref.is_verbose { if v.pref.is_verbose {
println('all .v files before:') println('all .v files before:')
println(v.files) println(v.files)
@ -239,11 +238,24 @@ fn (v mut V) compile() {
println('all .v files:') println('all .v files:')
println(v.files) println(v.files)
} }
if v.pref.is_debug {
println('\nparsers:')
for q in v.parsers {
println(q.file_name)
}
println('\nfiles:')
for q in v.files {
println(q)
}
}
// First pass (declarations) // First pass (declarations)
for file in v.files { for file in v.files {
mut p := v.new_parser(file) for i, p in v.parsers {
p.parse(.decl) if p.file_path == file {
//if p.pref.autofree { p.scanner.text.free() free(p.scanner) } v.parsers[i].parse(.decl)
break
}
}
} }
// Main pass // Main pass
cgen.pass = Pass.main cgen.pass = Pass.main
@ -279,13 +291,15 @@ fn (v mut V) compile() {
v.dir.contains('/ui'))) { v.dir.contains('/ui'))) {
cgen.genln('id defaultFont = 0; // main.v') cgen.genln('id defaultFont = 0; // main.v')
} }
// We need the cjson header for all the json decoding user will do in default mode // We need the cjson header for all the json decoding that will be done in
// default mode
if v.pref.build_mode == .default_mode { if v.pref.build_mode == .default_mode {
if imports_json { if imports_json {
cgen.genln('#include "cJSON.h"') cgen.genln('#include "cJSON.h"')
} }
} }
if v.pref.build_mode == .embed_vlib || v.pref.build_mode == .default_mode { if v.pref.build_mode == .embed_vlib || v.pref.build_mode == .default_mode {
//if v.pref.build_mode in [.embed_vlib, .default_mode] {
// If we declare these for all modes, then when running `v a.v` we'll get // If we declare these for all modes, then when running `v a.v` we'll get
// `/usr/bin/ld: multiple definition of 'total_m'` // `/usr/bin/ld: multiple definition of 'total_m'`
// TODO // TODO
@ -294,7 +308,7 @@ fn (v mut V) compile() {
$if !js { $if !js {
cgen.genln('int g_test_ok = 1; ') cgen.genln('int g_test_ok = 1; ')
} }
if 'json' in v.table.imports { if imports_json {
cgen.genln(' cgen.genln('
#define js_get(object, key) cJSON_GetObjectItemCaseSensitive((object), (key)) #define js_get(object, key) cJSON_GetObjectItemCaseSensitive((object), (key))
') ')
@ -307,8 +321,12 @@ fn (v mut V) compile() {
cgen.genln('this line will be replaced with definitions') cgen.genln('this line will be replaced with definitions')
defs_pos := cgen.lines.len - 1 defs_pos := cgen.lines.len - 1
for file in v.files { for file in v.files {
mut p := v.new_parser(file) for i, p in v.parsers {
p.parse(.main) if p.file_path == file {
v.parsers[i].parse(.main)
break
}
}
//if p.pref.autofree { p.scanner.text.free() free(p.scanner) } //if p.pref.autofree { p.scanner.text.free() free(p.scanner) }
// p.g.gen_x64() // p.g.gen_x64()
// Format all files (don't format automatically generated vlib headers) // Format all files (don't format automatically generated vlib headers)
@ -316,6 +334,10 @@ fn (v mut V) compile() {
// new vfmt is not ready yet // new vfmt is not ready yet
} }
} }
// Close the file with generated V code (str() methods etc) and parse it
v.vgen_file.close()
mut vgen_parser := v.new_parser(vgen_file_name)
vgen_parser.parse(.main)
v.log('Done parsing.') v.log('Done parsing.')
// Write everything // Write everything
mut d := strings.new_builder(10000)// Avoid unnecessary allocations mut d := strings.new_builder(10000)// Avoid unnecessary allocations
@ -335,8 +357,7 @@ fn (v mut V) compile() {
d.writeln('; // Prof counters:') d.writeln('; // Prof counters:')
d.writeln(v.prof_counters()) d.writeln(v.prof_counters())
} }
dd := d.str() cgen.lines[defs_pos] = d.str()
cgen.lines[defs_pos] = dd// TODO `def.str()` doesn't compile
v.generate_main() v.generate_main()
v.generate_hot_reload_code() v.generate_hot_reload_code()
if v.pref.is_verbose { if v.pref.is_verbose {
@ -716,6 +737,10 @@ fn (v &V) log(s string) {
} }
fn new_v(args[]string) &V { fn new_v(args[]string) &V {
os.rm(vgen_file_name)
vgen_file := os.open_append(vgen_file_name) or { panic(err) }
vgen_file.writeln('module main\nimport strings')
joined_args := args.join(' ') joined_args := args.join(' ')
target_os := get_arg(joined_args, 'os', '') target_os := get_arg(joined_args, 'os', '')
mut out_name := get_arg(joined_args, 'o', 'a.out') mut out_name := get_arg(joined_args, 'o', 'a.out')
@ -907,6 +932,7 @@ fn new_v(args[]string) &V {
vroot: vroot vroot: vroot
pref: pref pref: pref
mod: mod mod: mod
vgen_file: vgen_file
} }
} }

View File

@ -9,12 +9,17 @@ import (
strings strings
) )
const (
vgen_file_name = 'vgen.tmp'
)
// TODO rename to Token // TODO rename to Token
// TODO rename enum Token to TokenType // TODO rename enum Token to TokenType
struct Tok { struct Tok {
tok Token tok Token
lit string lit string
line_nr int line_nr int
name_idx int // name table index for O(1) lookup
// col int // col int
} }
@ -103,6 +108,8 @@ fn (v mut V) new_parser(path string) Parser {
break break
} }
} }
//vgen_file := os.open_append(vgen_file_name) or { panic(err) }
mut p := Parser { mut p := Parser {
v: v v: v
@ -120,7 +127,6 @@ fn (v mut V) new_parser(path string) Parser {
os: v.os os: v.os
vroot: v.vroot vroot: v.vroot
local_vars: [Var{}].repeat(MaxLocalVars) local_vars: [Var{}].repeat(MaxLocalVars)
} }
$if js { $if js {
p.is_js = true p.is_js = true
@ -144,7 +150,15 @@ fn (v mut V) new_parser(path string) Parser {
break break
} }
} }
v.add_parser(p)
/*
if !(p in v.parsers) {
v.parsers << p
}
*/
//p.next() //p.next()
//p.scanner.debug_tokens() //p.scanner.debug_tokens()
return p return p
@ -202,6 +216,7 @@ fn (p & Parser) peek() Token {
/*
fn (p mut Parser) next_old() { fn (p mut Parser) next_old() {
p.prev_tok2 = p.prev_tok p.prev_tok2 = p.prev_tok
p.prev_tok = p.tok p.prev_tok = p.tok
@ -210,6 +225,7 @@ fn (p mut Parser) next_old() {
p.tok = res.tok p.tok = res.tok
p.lit = res.lit p.lit = res.lit
} }
*/
fn (p &Parser) log(s string) { fn (p &Parser) log(s string) {
/* /*
@ -423,7 +439,7 @@ fn (p mut Parser) import_statement() {
if p.tok != .name { if p.tok != .name {
p.error('bad import format') p.error('bad import format')
} }
if p.peek() == .number && p.scanner.text[p.scanner.pos + 1] == `.` { if p.peek() == .number { // && p.scanner.text[p.scanner.pos + 1] == `.` {
p.error('bad import format. module/submodule names cannot begin with a number') p.error('bad import format. module/submodule names cannot begin with a number')
} }
mut mod := p.check_name().trim_space() mut mod := p.check_name().trim_space()
@ -842,15 +858,18 @@ fn (p mut Parser) check(expected Token) {
print_backtrace() print_backtrace()
p.error(s) p.error(s)
} }
/*
if expected == .rcbr { if expected == .rcbr {
p.fmt_dec() p.fmt_dec()
} }
p.fgen(p.strtok()) p.fgen(p.strtok())
// vfmt: increase indentation on `{` unless it's `{}` // vfmt: increase indentation on `{` unless it's `{}`
// TODO
if expected == .lcbr && p.scanner.pos + 1 < p.scanner.text.len && p.scanner.text[p.scanner.pos + 1] != `}` { if expected == .lcbr && p.scanner.pos + 1 < p.scanner.text.len && p.scanner.text[p.scanner.pos + 1] != `}` {
p.fgenln('') p.fgenln('')
p.fmt_inc() p.fmt_inc()
} }
*/
p.next() p.next()
if p.scanner.line_comment != '' { if p.scanner.line_comment != '' {
@ -3896,6 +3915,10 @@ fn (p mut Parser) check_and_register_used_imported_type(typ_name string) {
} }
fn (p mut Parser) check_unused_imports() { fn (p mut Parser) check_unused_imports() {
// Don't run in the generated V file with `.str()`
if p.fileis(vgen_file_name) {
return
}
mut output := '' mut output := ''
for alias, mod in p.import_table.imports { for alias, mod in p.import_table.imports {
if !p.import_table.is_used_import(alias) { if !p.import_table.is_used_import(alias) {

View File

@ -38,11 +38,11 @@ mut:
fn new_scanner(file_path string) &Scanner { fn new_scanner(file_path string) &Scanner {
if !os.file_exists(file_path) { if !os.file_exists(file_path) {
verror('"$file_path" doesn\'t exist') verror("$file_path doesn't exist")
} }
mut raw_text := os.read_file(file_path) or { mut raw_text := os.read_file(file_path) or {
verror('scanner: failed to open "$file_path"') verror('scanner: failed to open $file_path')
return 0 return 0
} }
@ -660,14 +660,15 @@ fn (s &Scanner) error(msg string) {
println(pointerline) println(pointerline)
} }
fullpath := os.realpath( s.file_path ) fullpath := os.realpath( s.file_path )
_ = fullpath
// The filepath:line:col: format is the default C compiler // The filepath:line:col: format is the default C compiler
// error output format. It allows editors and IDE's like // error output format. It allows editors and IDE's like
// emacs to quickly find the errors in the output // emacs to quickly find the errors in the output
// and jump to their source with a keyboard shortcut. // and jump to their source with a keyboard shortcut.
// Using only the filename leads to inability of IDE/editors // Using only the filename leads to inability of IDE/editors
// to find the source file, when it is in another folder. // to find the source file, when it is in another folder.
//println('${s.file_path}:${s.line_nr + 1}:${column+1}: $msg') println('${s.file_path}:${s.line_nr + 1}:${column+1}: $msg')
println('${fullpath}:${s.line_nr + 1}:${column+1}: $msg') //println('${fullpath}:${s.line_nr + 1}:${column+1}: $msg')
exit(1) exit(1)
} }
@ -834,53 +835,8 @@ fn is_nl(c byte) bool {
return c == `\r` || c == `\n` return c == `\r` || c == `\n`
} }
fn (s &Scanner) get_opening_bracket() int {
mut pos := s.pos
mut parentheses := 0
mut inside_string := false
for pos > 0 && s.text[pos] != `\n` {
if s.text[pos] == `)` && !inside_string {
parentheses++
}
if s.text[pos] == `(` && !inside_string {
parentheses--
}
if s.text[pos] == `\'` && s.text[pos - 1] != `\\` && s.text[pos - 1] != `\`` { // ` // apostrophe balance comment. do not remove
inside_string = !inside_string
}
if parentheses == 0 {
break
}
pos--
}
return pos
}
// Foo { bar: 3, baz: 'hi' } => '{ bar: 3, baz: "hi" }'
fn (s mut Scanner) create_type_string(T Type, name string) {
line := s.line_nr
inside_string := s.inside_string
mut newtext := '\'{ '
start := s.get_opening_bracket() + 1
end := s.pos
for i, field in T.fields {
if i != 0 {
newtext += ', '
}
newtext += '$field.name: ' + '$${name}.${field.name}'
}
newtext += ' }\''
s.text = s.text.substr(0, start) + newtext + s.text.substr(end, s.text.len)
s.pos = start - 2
s.line_nr = line
s.inside_string = inside_string
}
fn contains_capital(s string) bool { fn contains_capital(s string) bool {
// for c in s { for c in s {
for i := 0; i < s.len; i++ {
c := s[i]
if c >= `A` && c <= `Z` { if c >= `A` && c <= `Z` {
return true return true
} }

View File

@ -20,8 +20,23 @@ mut:
cflags []CFlag // ['-framework Cocoa', '-lglfw3'] cflags []CFlag // ['-framework Cocoa', '-lglfw3']
fn_cnt int //atomic fn_cnt int //atomic
obfuscate bool obfuscate bool
//names []Name
} }
/*
enum NameCategory {
constant
mod
var
typ
}
struct Name {
cat NameCategory
}
*/
struct GenTable { struct GenTable {
fn_name string fn_name string
mut: mut:

View File

@ -1,9 +1,11 @@
struct Foo { struct Foo {
a int number int
str string
f f64
} }
fn test_array_str() { fn test_array_str() {
f := Foo{34} f := Foo{34, 'hello', 1.2}
println(f) println(f)
//s := f.str() //s := f.str()
//println(s) //println(s)

View File

@ -7,7 +7,7 @@
- remove all compiler memory leaks - remove all compiler memory leaks
- fix child <T> function calls - fix child <T> function calls
+ fix non-ascii rendering in gg (ä, å, etc) + fix non-ascii rendering in gg (ä, å, etc)
- cache all tokens once + cache all tokens once
- enable vfmt - enable vfmt
- bring back vdoc and regenerate all module docs - bring back vdoc and regenerate all module docs
- optimize the parser (reduce map lookups) - optimize the parser (reduce map lookups)