fix: comment

tanzaku · tanzaku · commit d2216b8f1e87 · 2025-03-15T20:10:34.000+09:00
diff --git a/crates/lexer-generator/src/lexer_generator.rs b/crates/lexer-generator/src/lexer_generator.rs
@@ -4,7 +4,7 @@ use self::flex_file::{parse_flex_file, FlexFile};
 
 mod flex_file;
 
-/// 各状態の全ルールに一意な名前を付ける
+/// Assign unique names to all rules in each state
 fn construct_rule_kinds(flex_file: &FlexFile) -> String {
     let mut res = Vec::new();
     let mut map: HashMap<&String, usize> = HashMap::new();
@@ -20,7 +20,7 @@ fn construct_rule_kinds(flex_file: &FlexFile) -> String {
     res.join(",\n")
 }
 
-/// action部分のコードを生成する
+/// Generate code for the action part
 fn construct_actions(flex_file: &FlexFile) -> String {
     let mut res = Vec::new();
     let mut map: HashMap<&String, usize> = HashMap::new();
@@ -30,7 +30,7 @@ fn construct_actions(flex_file: &FlexFile) -> String {
             let e = map.entry(s).or_default();
             *e += 1;
 
-            // actionが | の場合、後続のルールが実行される
+            // If the action is |, the subsequent rule will be executed
             if rule.actions.trim() == "|" {
                 res.push(format!(
                     r#"RuleKind::{kind}|"#,
@@ -51,17 +51,17 @@ fn construct_actions(flex_file: &FlexFile) -> String {
     res.join("\n")
 }
 
-/// ルールのパターンを正規表現に変換する
+/// Convert rule patterns to regular expressions
 fn extract_rule_pattern(flex_file: &FlexFile, pattern: &str) -> String {
     if pattern == "<<EOF>>" {
         return "^$".to_string();
     }
 
-    // {xxx}のパターンを抽出する正規表現パターン
+    // Regular expression pattern to extract {xxx} patterns
     let p = regex::Regex::new(r#"\{([a-zA-Z0-9_]+)\}"#).unwrap();
 
-    // flexではダブルクオートをエスケープする必要があるが、正規表現では不要である
-    // そのため、正規表現パターンにする前にダブルクオートのエスケープを除外する
+    // In flex, double quotes need to be escaped, but not in regular expressions
+    // Therefore, remove the escaping of double quotes before converting to regex pattern
     fn remove_unnecessary_quote(s: &str) -> String {
         let chars = s.chars().collect::<Vec<_>>();
         let mut remove = vec![false; chars.len()];
@@ -98,11 +98,11 @@ fn extract_rule_pattern(flex_file: &FlexFile, pattern: &str) -> String {
             .collect()
     }
 
-    // {xxx}を実際の正規表現パターンに展開する
+    // Expand {xxx} to actual regular expression patterns
     p.replace_all(&pattern, |caps: &regex::Captures| {
         let name = caps.get(1).unwrap().as_str();
 
-        // {xxx}のxxxが定義されているかをチェックする
+        // Check if xxx in {xxx} is defined
         if let Some(def) = flex_file.definitions.iter().find(|def| def.name == name) {
             let pattern = remove_unnecessary_quote(&def.def);
             let rep = extract_rule_pattern(flex_file, &pattern);
@@ -114,7 +114,7 @@ fn extract_rule_pattern(flex_file: &FlexFile, pattern: &str) -> String {
     .to_string()
 }
 
-/// Rule構造体を生成する
+/// Generate Rule structures
 fn construct_rule_defs(flex_file: &FlexFile) -> String {
     let mut res = Vec::new();
     let mut map: HashMap<&String, usize> = HashMap::new();
@@ -142,12 +142,12 @@ fn construct_rule_defs(flex_file: &FlexFile) -> String {
     res.join(",\n")
 }
 
-/// 状態を表すenumを生成する
+/// Generate enum representing states
 fn construct_states(flex_file: &FlexFile) -> String {
     flex_file.all_states.clone().join(",\n")
 }
 
-/// scan.lに基づいてLexerを生成する
+/// Generate Lexer based on scan.l
 pub fn generate() {
     let flex_file = parse_flex_file(include_str!("../resources/scan.l"));
     let template = include_str!("../templates/lex_template.rs");
@@ -157,7 +157,7 @@ pub fn generate() {
     let rule_defs = construct_rule_defs(&flex_file);
     let states = construct_states(&flex_file);
 
-    // キーワード一覧を抽出する
+    // Extract keyword list
     let mut keywords = Vec::new();
     for line in include_str!("../resources/kwlist.h").lines() {
         if line.starts_with("PG_KEYWORD") {
diff --git a/crates/lexer-generator/templates/lex_template.rs b/crates/lexer-generator/templates/lex_template.rs
@@ -3,7 +3,6 @@
 
 use std::collections::HashMap;
 
-// use regex::{Match, Regex};
 use regex::bytes::Regex;
 
 use super::{
diff --git a/crates/parser-generator/src/parser_generator/bison.rs b/crates/parser-generator/src/parser_generator/bison.rs
@@ -39,12 +39,12 @@ pub enum RawComponent {
 #[derive(Debug, Clone, Copy, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct ComponentId(pub u16);
 
-/// 構文規則のコンポーネント
+/// Component of the syntax rule
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub enum Component {
-    /// 非終端記号
+    /// Non-terminal symbol
     NonTerminal(String),
-    /// 終端記号
+    /// Terminal symbol
     Terminal(TokenKind),
 }
 
@@ -134,25 +134,6 @@ pub struct Bison {
     pub rules: Vec<Rule>,
 
     pub rule_names: Vec<String>,
-    // これ使ってる？
-    // pub comments: Vec<Token>,
-
-    // 構文解析表作るやつなので消す
-    // pub components: Vec<Component>,
-    // pub component_map: HashMap<Component, ComponentId>,
-
-    // pub name_to_rules: HashMap<String, Vec<usize>>,
-
-    // pub first_set: HashMap<ComponentId, HashSet<ComponentId>>,
-    // pub nullable: HashMap<ComponentId, bool>,
-
-    // pub state_set: StateSet,
-    // pub action_table: HashMap<(usize, ComponentId), Action>,
-    // pub goto_table: HashMap<(usize, ComponentId), usize>,
-    // pub accept_rule_component_id: ComponentId,
-    // pub accept_rule_component: Component,
-    // pub end_rule_component_id: ComponentId,
-    // pub end_rule_component: Component,
 }
 
 impl Bison {
@@ -191,7 +172,7 @@ fn parse_type(bison: &mut Bison, line: &str, deq: &mut VecDeque<String>) {
                 .insert(non_terminal_symbol.to_string(), typ.to_string());
         }
 
-        // 空白スタートの場合継続業とみなす
+        // If the next line starts with whitespace, treat it as a continuation line
         if deq.front().map_or(false, is_start_whitespace) {
             line = deq.pop_front().unwrap();
         } else {
@@ -221,7 +202,7 @@ fn parse_token(bison: &mut Bison, line: &str, deq: &mut VecDeque<String>) {
             bison.token.insert(terminal_symbol.to_string(), typ.clone());
         }
 
-        // 空白スタートの場合継続業とみなす
+        // If the next line starts with whitespace or is empty, treat it as a continuation line
         if deq
             .front()
             .map_or(false, |line| is_start_whitespace(line) || line.is_empty())
@@ -249,8 +230,8 @@ fn parse_assoc(
 
     loop {
         for name in line.split_whitespace() {
-            // ブロックコメントの開始を見つけたら終了
-            // 雑だがpostgresqlのgrammerをparseする分には問題ない
+            // Stop as soon as we find the start of a block comment.
+            // This is crude, but sufficient for parsing PostgreSQL's grammar
             if name == "/*" {
                 break;
             }
@@ -264,7 +245,7 @@ fn parse_assoc(
             bison.assoc.insert(name.to_string(), assoc);
         }
 
-        // 空白スタートの場合継続業とみなす
+        // If the next line starts with whitespace, treat it as a continuation line
         if deq.front().map_or(false, is_start_whitespace) {
             line = deq.pop_front().unwrap();
         } else {
@@ -603,29 +584,6 @@ pub fn parse_bison(s: impl AsRef<str>) -> Bison {
         assoc: HashMap::new(),
         rules: Vec::new(),
         rule_names: Vec::new(),
-        // 未使用
-        // comments: Vec::new(),
-
-        // Lalr構造体に移動
-        // components: Vec::new(),
-        // component_map: HashMap::new(),
-
-        // name_to_rules: HashMap::new(),
-
-        // first_set: HashMap::new(),
-        // nullable: HashMap::new(),
-
-        // state_set: StateSet {
-        //     states: Vec::new(),
-        //     need_update: HashSet::new(),
-        // },
-        // action_table: HashMap::new(),
-        // goto_table: HashMap::new(),
-
-        // accept_rule_component: Component::NonTerminal("dummy".to_string()),
-        // accept_rule_component_id: ComponentId(0),
-        // end_rule_component: Component::NonTerminal("dummy".to_string()),
-        // end_rule_component_id: ComponentId(0),
     };
 
     while let Some(line) = deq.pop_front() {
diff --git a/crates/parser-generator/src/parser_generator/lalr.rs b/crates/parser-generator/src/parser_generator/lalr.rs
@@ -89,7 +89,7 @@ pub struct State {
 }
 
 impl State {
-    // LALR用の差分。先読み記号を無視する
+    // Comparison used for LALR: ignores lookahead symbols
     fn equals_without_lookahead(&self, other: &State) -> bool {
         if self.items.len() != other.items.len() {
             return false;
@@ -101,7 +101,7 @@ impl State {
             .all(|(l, r)| l.rule_index == r.rule_index && l.dot_pos == r.dot_pos)
     }
 
-    // LALR用の差分。先読み記号を無視する
+    // Comparison used for LR: takes lookahead symbols into account
     fn equals(&self, other: &State) -> bool {
         if self.items.len() != other.items.len() {
             return false;
@@ -141,7 +141,7 @@ impl StateSet {
         {
             self.states[from_index].edge.insert((comp, i));
 
-            // 先読み記号まで含めて同一ならスキップ
+            // Skip if it's identical including lookahead symbols
             if state.equals(&self.states[i]) {
                 return;
             }
@@ -375,13 +375,13 @@ impl Lalr {
             .collect();
     }
 
-    // TODO closureをテストする
+    // TODO: Test the closure function
     fn closure(&mut self, state: &mut State) {
         let mut in_deq = vec![false; state.items.len()];
 
         let prev_item_len = state.items.len();
 
-        // LR(1)アイテム集合の単一状態の変化がなくなるまで繰り返す
+        // Repeat until there are no more changes in the LR(1) item set for a single state
         let mut deq = VecDeque::from_iter(0..state.items.len());
         while let Some(j) = deq.pop_front() {
             in_deq[j] = false;
@@ -396,7 +396,7 @@ impl Lalr {
                 continue;
             }
 
-            // ドットの次の要素が非終端記号の場合には、その非終端記号を左辺に持つ全ての規則について、非終端記号の先頭にドットおるアイテムを追加する。
+            // If the symbol after the dot is a non-terminal, then for every rule that has that non-terminal on its left-hand side, add an item with the dot at the start of the rule.
             let component_id = self.rules[rule_index].components[dot_pos];
             if let Component::Terminal(_) = &self.id_mapper.components[component_id.0 as usize] {
                 continue;
@@ -405,7 +405,7 @@ impl Lalr {
             let mut lookaheads = self.first_set_after[rule_index][dot_pos + 1].clone();
             let nullable = self.nullable[rule_index][dot_pos + 1];
 
-            // その際の先読み記号は、first_set(非終端記号の続き + lookahead)で求まる
+            // The lookahead symbols for those items are first_set(symbols following the non-terminal + this item's lookahead)
             if nullable {
                 state.items[j]
                     .lookahead
@@ -416,17 +416,17 @@ impl Lalr {
             self.rule_indices_by_name_id[component_id.0 as usize]
                 .iter()
                 .for_each(|&new_item_index| {
-                    // 追加予定のアイテムが既に存在するかチェックする
+                    // Check if the item to be added already exists
                     let j: Option<&usize> = state.item_indices.get(&new_item_index);
 
                     if let Some(&j) = j {
-                        // あれば先読み記号のみ追加
+                        // If it exists, only add lookahead symbols
                         if state.items[j].insert_lookaheads(&lookaheads) && !in_deq[j] {
                             deq.push_back(j);
                             in_deq[j] = true;
                         }
                     } else {
-                        // なければ追加
+                        // If it doesn't exist, add it
                         let new_item = Item {
                             rule_index: new_item_index,
                             dot_pos: 0,
@@ -445,11 +445,11 @@ impl Lalr {
         }
     }
 
-    /// 構文解析表を作成する
-    /// 1. LR(1)項集合の作成
+    /// Build the parse table
+    /// 1. Create LR(1) item sets
     pub fn build_lalr1_parse_table(&mut self) {
-        // bisonでは明示的に指定しない場合、最初のルールが起点のルールになる
-        // PostgreSQLの場合、明示的に指定していないため、最初のルールを起点とする
+        // In bison, if not explicitly specified, the first rule becomes the starting rule
+        // In the case of PostgreSQL, it's not explicitly specified, so we use the first rule as the starting point
         let start_rule_index = self.rules.len();
         let start_component_id = self.rules[0].name_id;
 
@@ -494,8 +494,8 @@ impl Lalr {
 
             // dbg!(i, state_set.states.len());
 
-            // ドットを進めた状態を作る
-            // ドットを進める状態を、次の記号でグループ化
+            // Create states by advancing the dot
+            // Group the states where the dot is advanced by the next symbol
             let mut next_states: BTreeMap<ComponentId, Vec<_>> = BTreeMap::new();
             for j in 0..state_set.states[i].items.len() {
                 let dot_pos = state_set.states[i].items[j].dot_pos;
@@ -528,7 +528,7 @@ impl Lalr {
 
         dbg!(state_set.states.len());
 
-        // 構文解析表を構築
+        // Build the parse table (action and goto tables)
         let mut action_table: HashMap<(usize, ComponentId), Action> = HashMap::new();
         let mut goto_table: HashMap<(usize, ComponentId), usize> = HashMap::new();
 
@@ -577,29 +577,29 @@ impl Lalr {
 
                     match (reduce, shift) {
                         (Some(reduce), Some(shift)) if reduce.priority < shift.priority => {
-                            // shiftを採用
+                            // adopt shift
                         }
                         (Some(reduce), Some(shift)) if reduce.priority > shift.priority => {
-                            // reduceを採用
+                            // adopt reduce
                             action_table.insert(key, reduce_action);
                         }
                         (Some(_), Some(shift)) => {
                             match shift.directive {
                                 AssocDirective::NonAssoc => {
-                                    // このケースはparse error
+                                    // This case is a parse error
                                     action_table.insert(key, Action::Error);
                                 }
                                 AssocDirective::Left => {
-                                    // reduceを採用
+                                    // adopt reduce
                                     action_table.insert(key, reduce_action);
                                 }
                                 AssocDirective::Right => {
-                                    // shiftを採用
+                                    // adopt shift
                                 }
                             }
                         }
                         _ => {
-                            // いずれかに優先度がなければshift優先らしい
+                            // If either one doesn't have a priority, shift seems to be preferred
                         }
                     }
                 }
diff --git a/crates/postgresql-cst-parser/src/lib.rs b/crates/postgresql-cst-parser/src/lib.rs
@@ -20,6 +20,3 @@ pub use cst::SyntaxToken;
 pub fn parse(input: &str) -> Result<ResolvedNode, ParseError> {
     cst::parse(input)
 }
-
-#[cfg(test)]
-mod tests {}

Original file line number	Diff line number	Diff line change
`@@ -20,6 +20,3 @@ pub use cst::SyntaxToken;`
`20`	`20`	`pub fn parse(input: &str) -> Result<ResolvedNode, ParseError> {`
`21`	`21`	`cst::parse(input)`
`22`	`22`	`}`
`23`		`-`
`24`		`-#[cfg(test)]`
`25`		`-mod tests {}`