From 3581ed74fe08ca676f2c3cd6f6fa7db05c9ff09c Mon Sep 17 00:00:00 2001 From: peefy Date: Mon, 6 Nov 2023 20:47:58 +0800 Subject: [PATCH] feat: impl string-like schema attribute parser and ast printer Signed-off-by: peefy --- kclvm/ast/src/token.rs | 14 +++ kclvm/ast_pretty/src/node.rs | 12 ++- .../ast_pretty/src/test_data/codelayout.input | 2 + .../src/test_data/codelayout.output | 2 + kclvm/parser/src/parser/stmt.rs | 62 ++++++++++-- kclvm/parser/src/tests/error_recovery.rs | 13 +++ ...ror_recovery__schema_stmt_recovery_32.snap | 88 +++++++++++++++++ ...ror_recovery__schema_stmt_recovery_33.snap | 97 +++++++++++++++++++ ...ror_recovery__schema_stmt_recovery_34.snap | 54 +++++++++++ ...ror_recovery__schema_stmt_recovery_35.snap | 86 ++++++++++++++++ kclvm/sema/src/resolver/node.rs | 8 +- .../grammar/schema/str_attr/str_attr_0/main.k | 23 +++++ .../schema/str_attr/str_attr_0/stdout.golden | 6 ++ .../grammar/schema/str_attr/str_attr_1/main.k | 22 +++++ .../schema/str_attr/str_attr_1/stdout.golden | 6 ++ 15 files changed, 482 insertions(+), 13 deletions(-) create mode 100644 kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_32.snap create mode 100644 kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_33.snap create mode 100644 kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_34.snap create mode 100644 kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_35.snap create mode 100644 test/grammar/schema/str_attr/str_attr_0/main.k create mode 100644 test/grammar/schema/str_attr/str_attr_0/stdout.golden create mode 100644 test/grammar/schema/str_attr/str_attr_1/main.k create mode 100644 test/grammar/schema/str_attr/str_attr_1/stdout.golden diff --git a/kclvm/ast/src/token.rs b/kclvm/ast/src/token.rs index 177416e33..dfdcc1bdd 100644 --- a/kclvm/ast/src/token.rs +++ b/kclvm/ast/src/token.rs @@ -334,6 +334,20 @@ impl Token { self.run_on_ident(|id| id.name == kw) } + /// Whether the token is a string literal token. + pub fn is_string_lit(&self) -> bool { + match self.kind { + TokenKind::Literal(lit) => { + if let LitKind::Str { .. } = lit.kind { + true + } else { + false + } + } + _ => false, + } + } + fn run_on_ident(&self, pred: impl FnOnce(Ident) -> bool) -> bool { match self.ident() { Some(id) => pred(id), diff --git a/kclvm/ast_pretty/src/node.rs b/kclvm/ast_pretty/src/node.rs index 77fee683a..a785534c3 100644 --- a/kclvm/ast_pretty/src/node.rs +++ b/kclvm/ast_pretty/src/node.rs @@ -345,7 +345,7 @@ impl<'p, 'ctx> MutSelfTypedResultWalker<'ctx> for Printer<'p> { if !schema_attr.decorators.is_empty() { self.write_newline(); } - self.write(&schema_attr.name.node); + self.write_attribute(&schema_attr.name); if schema_attr.is_optional { self.write("?"); } @@ -878,6 +878,16 @@ impl<'p> Printer<'p> { } } } + + fn write_attribute(&mut self, attr: &ast::NodeRef) { + let re = fancy_regex::Regex::new(IDENTIFIER_REGEX).unwrap(); + let need_quote = !re.is_match(&attr.node).unwrap(); + if need_quote { + self.write(&format!("{:?}", attr.node)); + } else { + self.write(&attr.node); + }; + } } impl<'p> Printer<'p> { diff --git a/kclvm/ast_pretty/src/test_data/codelayout.input b/kclvm/ast_pretty/src/test_data/codelayout.input index 46121bd5e..8df50874f 100644 --- a/kclvm/ast_pretty/src/test_data/codelayout.input +++ b/kclvm/ast_pretty/src/test_data/codelayout.input @@ -7,6 +7,8 @@ import math as alias_math schema Person ( Base): name:str age:int + "attr": str + "attr-x": str check : age>0 if age , "age must > 0" person = Person{ diff --git a/kclvm/ast_pretty/src/test_data/codelayout.output b/kclvm/ast_pretty/src/test_data/codelayout.output index b0b658248..d7171dd65 100644 --- a/kclvm/ast_pretty/src/test_data/codelayout.output +++ b/kclvm/ast_pretty/src/test_data/codelayout.output @@ -6,6 +6,8 @@ import math as alias_math schema Person(Base): name: str age: int + attr: str + "attr-x": str check: age > 0 if age, "age must > 0" diff --git a/kclvm/parser/src/parser/stmt.rs b/kclvm/parser/src/parser/stmt.rs index ed5d04fe6..ab2b3a0b7 100644 --- a/kclvm/parser/src/parser/stmt.rs +++ b/kclvm/parser/src/parser/stmt.rs @@ -909,8 +909,16 @@ impl<'a> Parser<'a> { fn parse_schema_body(&mut self) -> SchemaStmt { self.bump_token(TokenKind::Indent); - // doc string - let body_doc = self.parse_doc(); + // doc string when it is not a string-like attribute statement. + let body_doc = if let Some(peek) = self.cursor.peek() { + if matches!(peek.kind, TokenKind::Colon) { + None + } else { + self.parse_doc() + } + } else { + self.parse_doc() + }; // mixin let body_mixins = if self.token.is_keyword(kw::Mixin) { @@ -942,6 +950,20 @@ impl<'a> Parser<'a> { body_body.push(self.parse_if_stmt()); continue; } + // schema_attribute_stmt: string COLON type_annotation + else if self.token.is_string_lit() { + if let Some(peek) = self.cursor.peek() { + if let TokenKind::Colon = peek.kind { + let token = self.token; + let attr = self.parse_schema_attribute(); + body_body.push(node_ref!( + Stmt::SchemaAttr(attr), + self.token_span_pos(token, self.prev_token) + )); + continue; + } + } + } // schema_attribute_stmt else if let TokenKind::At = self.token.kind { let token = self.token; @@ -1133,7 +1155,7 @@ impl<'a> Parser<'a> { /// Syntax: /// schema_attribute_stmt: attribute_stmt NEWLINE - /// attribute_stmt: [decorators] identifier [QUESTION] COLON type [(ASSIGN|COMP_OR) test] + /// attribute_stmt: [decorators] (identifier | string) [QUESTION] COLON type [(ASSIGN|COMP_OR) test] fn parse_schema_attribute(&mut self) -> SchemaAttr { let doc = "".to_string(); @@ -1146,12 +1168,17 @@ impl<'a> Parser<'a> { Vec::new() }; - let name_expr = self.parse_identifier(); - - let name_pos = name_expr.pos(); - let name = name_expr.node; - let name = node_ref!(name.get_names().join("."), name_pos); + // Parse schema identifier-like or string-like attributes + let name = if let Some(name) = self.parse_string_attribute() { + name + } else { + let name_expr = self.parse_identifier(); + let name_pos = name_expr.pos(); + let name = name_expr.node; + node_ref!(name.get_names().join("."), name_pos) + }; + // Parse attribute optional annotation `?` let is_optional = if let TokenKind::Question = self.token.kind { self.bump_token(TokenKind::Question); true @@ -1159,8 +1186,10 @@ impl<'a> Parser<'a> { false }; + // Bump the schema attribute annotation token `:` self.bump_token(TokenKind::Colon); + // Parse the schema attribute type annotation. let typ = self.parse_type_annotation(); let type_str = node_ref!(typ.node.to_string(), typ.pos()); @@ -1479,6 +1508,23 @@ impl<'a> Parser<'a> { ) } + pub(crate) fn parse_string_attribute(&mut self) -> Option> { + match self.token.kind { + TokenKind::Literal(lit) => { + if let LitKind::Str { .. } = lit.kind { + let str_expr = self.parse_str_expr(lit); + match &str_expr.node { + Expr::StringLit(str) => Some(node_ref!(str.value.clone(), str_expr.pos())), + _ => None, + } + } else { + None + } + } + _ => None, + } + } + pub(crate) fn parse_joined_string( &mut self, s: &StringLit, diff --git a/kclvm/parser/src/tests/error_recovery.rs b/kclvm/parser/src/tests/error_recovery.rs index 1c3ab1553..afd73ca3c 100644 --- a/kclvm/parser/src/tests/error_recovery.rs +++ b/kclvm/parser/src/tests/error_recovery.rs @@ -274,6 +274,19 @@ parse_module_snapshot! { schema_stmt_recovery_31, r#" schema A: [str]: str [str]: int"#} +parse_module_snapshot! { schema_stmt_recovery_32, r#" +schema A: + "attr": str"#} +parse_module_snapshot! { schema_stmt_recovery_33, r#" +schema A: + """Schema Doc""" + "attr": str"#} +parse_module_snapshot! { schema_stmt_recovery_34, r#" +schema A: + "attr: str"#} +parse_module_snapshot! { schema_stmt_recovery_35, r#" +schema A: + "attr":"#} parse_module_snapshot! { rule_stmt_recovery_0, r#"rule"#} parse_module_snapshot! { rule_stmt_recovery_1, r#"rule A"#} parse_module_snapshot! { rule_stmt_recovery_2, r#"rule A["#} diff --git a/kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_32.snap b/kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_32.snap new file mode 100644 index 000000000..cc938b07d --- /dev/null +++ b/kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_32.snap @@ -0,0 +1,88 @@ +--- +source: parser/src/tests/error_recovery.rs +assertion_line: 277 +expression: "crate::tests::parsing_module_string(r#\"\nschema A:\n \"attr\": str\"#)" +--- +Module { + filename: "", + pkg: "", + doc: None, + name: "", + body: [ + Node { + node: Schema( + SchemaStmt { + doc: None, + name: Node { + node: "A", + filename: "", + line: 2, + column: 7, + end_line: 2, + end_column: 8, + }, + parent_name: None, + for_host_name: None, + is_mixin: false, + is_protocol: false, + args: None, + mixins: [], + body: [ + Node { + node: SchemaAttr( + SchemaAttr { + doc: "", + name: Node { + node: "attr", + filename: "", + line: 3, + column: 4, + end_line: 3, + end_column: 10, + }, + type_str: Node { + node: "str", + filename: "", + line: 3, + column: 12, + end_line: 3, + end_column: 15, + }, + op: None, + value: None, + is_optional: false, + decorators: [], + ty: Node { + node: Basic( + Str, + ), + filename: "", + line: 3, + column: 12, + end_line: 3, + end_column: 15, + }, + }, + ), + filename: "", + line: 3, + column: 4, + end_line: 3, + end_column: 15, + }, + ], + decorators: [], + checks: [], + index_signature: None, + }, + ), + filename: "", + line: 2, + column: 0, + end_line: 3, + end_column: 15, + }, + ], + comments: [], +} + diff --git a/kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_33.snap b/kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_33.snap new file mode 100644 index 000000000..76462a4cc --- /dev/null +++ b/kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_33.snap @@ -0,0 +1,97 @@ +--- +source: parser/src/tests/error_recovery.rs +assertion_line: 280 +expression: "crate::tests::parsing_module_string(r#\"\nschema A:\n \"\"\"Schema Doc\"\"\"\n \"attr\": str\"#)" +--- +Module { + filename: "", + pkg: "", + doc: None, + name: "", + body: [ + Node { + node: Schema( + SchemaStmt { + doc: Some( + Node { + node: "\"\"\"Schema Doc\"\"\"", + filename: "", + line: 3, + column: 4, + end_line: 3, + end_column: 20, + }, + ), + name: Node { + node: "A", + filename: "", + line: 2, + column: 7, + end_line: 2, + end_column: 8, + }, + parent_name: None, + for_host_name: None, + is_mixin: false, + is_protocol: false, + args: None, + mixins: [], + body: [ + Node { + node: SchemaAttr( + SchemaAttr { + doc: "", + name: Node { + node: "attr", + filename: "", + line: 4, + column: 4, + end_line: 4, + end_column: 10, + }, + type_str: Node { + node: "str", + filename: "", + line: 4, + column: 12, + end_line: 4, + end_column: 15, + }, + op: None, + value: None, + is_optional: false, + decorators: [], + ty: Node { + node: Basic( + Str, + ), + filename: "", + line: 4, + column: 12, + end_line: 4, + end_column: 15, + }, + }, + ), + filename: "", + line: 4, + column: 4, + end_line: 4, + end_column: 15, + }, + ], + decorators: [], + checks: [], + index_signature: None, + }, + ), + filename: "", + line: 2, + column: 0, + end_line: 4, + end_column: 15, + }, + ], + comments: [], +} + diff --git a/kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_34.snap b/kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_34.snap new file mode 100644 index 000000000..8b6008a50 --- /dev/null +++ b/kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_34.snap @@ -0,0 +1,54 @@ +--- +source: parser/src/tests/error_recovery.rs +assertion_line: 284 +expression: "crate::tests::parsing_module_string(r#\"\nschema A:\n \"attr: str\"#)" +--- +Module { + filename: "", + pkg: "", + doc: None, + name: "", + body: [ + Node { + node: Schema( + SchemaStmt { + doc: Some( + Node { + node: "\"attr: str", + filename: "", + line: 3, + column: 4, + end_line: 3, + end_column: 14, + }, + ), + name: Node { + node: "A", + filename: "", + line: 2, + column: 7, + end_line: 2, + end_column: 8, + }, + parent_name: None, + for_host_name: None, + is_mixin: false, + is_protocol: false, + args: None, + mixins: [], + body: [], + decorators: [], + checks: [], + index_signature: None, + }, + ), + filename: "", + line: 2, + column: 0, + end_line: 3, + end_column: 14, + }, + ], + comments: [], +} + diff --git a/kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_35.snap b/kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_35.snap new file mode 100644 index 000000000..21f8d78a7 --- /dev/null +++ b/kclvm/parser/src/tests/snapshots/kclvm_parser__tests__error_recovery__schema_stmt_recovery_35.snap @@ -0,0 +1,86 @@ +--- +source: parser/src/tests/error_recovery.rs +assertion_line: 287 +expression: "crate::tests::parsing_module_string(r#\"\nschema A:\n \"attr\":\"#)" +--- +Module { + filename: "", + pkg: "", + doc: None, + name: "", + body: [ + Node { + node: Schema( + SchemaStmt { + doc: None, + name: Node { + node: "A", + filename: "", + line: 2, + column: 7, + end_line: 2, + end_column: 8, + }, + parent_name: None, + for_host_name: None, + is_mixin: false, + is_protocol: false, + args: None, + mixins: [], + body: [ + Node { + node: SchemaAttr( + SchemaAttr { + doc: "", + name: Node { + node: "attr", + filename: "", + line: 3, + column: 4, + end_line: 3, + end_column: 10, + }, + type_str: Node { + node: "any", + filename: "", + line: 3, + column: 11, + end_line: 3, + end_column: 11, + }, + op: None, + value: None, + is_optional: false, + decorators: [], + ty: Node { + node: Any, + filename: "", + line: 3, + column: 11, + end_line: 3, + end_column: 11, + }, + }, + ), + filename: "", + line: 3, + column: 4, + end_line: 3, + end_column: 11, + }, + ], + decorators: [], + checks: [], + index_signature: None, + }, + ), + filename: "", + line: 2, + column: 0, + end_line: 3, + end_column: 11, + }, + ], + comments: [], +} + diff --git a/kclvm/sema/src/resolver/node.rs b/kclvm/sema/src/resolver/node.rs index a92e237ec..a8e4fd5ef 100644 --- a/kclvm/sema/src/resolver/node.rs +++ b/kclvm/sema/src/resolver/node.rs @@ -631,8 +631,8 @@ impl<'ctx> MutSelfTypedResultWalker<'ctx> for Resolver<'ctx> { range, ); self.any_ty() - } else if let ast::Expr::StringLit(string_lit) = &subscript.value.node { - self.load_attr(value_ty, &string_lit.value, range) + } else if let TypeKind::StrLit(lit_value) = &index_key_ty.kind { + self.load_attr(value_ty, lit_value, range) } else { val_ty.clone() } @@ -656,8 +656,8 @@ impl<'ctx> MutSelfTypedResultWalker<'ctx> for Resolver<'ctx> { range, ); self.any_ty() - } else if let ast::Expr::StringLit(string_lit) = &subscript.value.node { - self.load_attr(value_ty, &string_lit.value, range) + } else if let TypeKind::StrLit(lit_value) = &index_key_ty.kind { + self.load_attr(value_ty, lit_value, range) } else { schema_ty.val_ty() } diff --git a/test/grammar/schema/str_attr/str_attr_0/main.k b/test/grammar/schema/str_attr/str_attr_0/main.k new file mode 100644 index 000000000..a14982d6b --- /dev/null +++ b/test/grammar/schema/str_attr/str_attr_0/main.k @@ -0,0 +1,23 @@ +schema Data: + "spec": Spec + +schema Spec: + "config": Config + +schema Config: + "template": Template + +schema Template: + [...str]: int + "name": str + +data = Data { + spec: { + config: { + template: { + name: "template" + id: 1 + } + } + } +} diff --git a/test/grammar/schema/str_attr/str_attr_0/stdout.golden b/test/grammar/schema/str_attr/str_attr_0/stdout.golden new file mode 100644 index 000000000..373d3582f --- /dev/null +++ b/test/grammar/schema/str_attr/str_attr_0/stdout.golden @@ -0,0 +1,6 @@ +data: + spec: + config: + template: + name: template + id: 1 diff --git a/test/grammar/schema/str_attr/str_attr_1/main.k b/test/grammar/schema/str_attr/str_attr_1/main.k new file mode 100644 index 000000000..14aa70d8f --- /dev/null +++ b/test/grammar/schema/str_attr/str_attr_1/main.k @@ -0,0 +1,22 @@ +schema Data: + "spec": Spec + +schema Spec: + "config": Config + +schema Config: + "template": Template + +schema Template: + "name": str + +data = Data { + spec: { + config: { + template: { + name: "template" + } + } + } +} +name = data["spec"]["config"]["template"].name diff --git a/test/grammar/schema/str_attr/str_attr_1/stdout.golden b/test/grammar/schema/str_attr/str_attr_1/stdout.golden new file mode 100644 index 000000000..d4216f94e --- /dev/null +++ b/test/grammar/schema/str_attr/str_attr_1/stdout.golden @@ -0,0 +1,6 @@ +data: + spec: + config: + template: + name: template +name: template