DolbyUUU
diff --git a/README.md b/README.md
Lines changed: 3 additions & 10 deletions
diff --git a/format_convertor.py b/format_convertor.py
Lines changed: 18 additions & 5 deletions
@@ -36,6 +36,7 @@ Sudoku puzzles are more than just a game—they are a **rich reasoning benchmark
      - Grids can be serialized in multiple ways (e.g., cell-level, row-level, or grid-level).
      - This allows researchers to explore the **optimal input format for structured data** in LLMs.
    - Sudoku4LLM supports 11 different serialization formats, making it a versatile tool for studying structured data representation.
+   - Researchers can easily design custom serialization formats or explore new structured data representations.
 
 ### 5. **Resistance to Memorization**
    - With **infinite variability** in puzzle generation, Sudoku puzzles are highly resistant to memorization, ensuring that models are genuinely reasoning rather than recalling.
@@ -182,24 +183,16 @@ Modify `config.py` to adjust default settings, including:
 
 ---
 
-## 🤝 Acknowledgements
-
-We would like to thank the following contributors, projects, and resources that inspired or supported this work:
-
-- [Add acknowledgements here.]
-
----
-
 ## 📜 Citation
 
 If you use **Sudoku4LLM** in your research, please cite us:
 
 ```bibtex
 @misc{Sudoku4LLM,
-  author = {Your Name},
+  author = {Yu Wang},
   title = {Sudoku4LLM: A Dataset Generator for Training and Evaluating Reasoning LLMs},
   year = {2025},
-  url = {https://github.com/your-repo/Sudoku4LLM},
+  url = {https://github.com/DolbyUUU/Sudoku4LLM},
   note = {Version 1.0}
 }
 ```
@@ -1,3 +1,5 @@
+# Sudoku4LLM/format_convertor.py
+
 import json
 import os
 from config import SudokuConfig  # Importing the config.py module for format options
@@ -14,7 +16,8 @@ def load_puzzles(self):
         try:
             with open(self.input_jsonl, "r") as file:
                 for line in file:
-                    puzzles.append(json.loads(line)["puzzle"])
+                    puzzle_data = json.loads(line)
+                    puzzles.append(puzzle_data)
         except FileNotFoundError:
             print(f"Error: Input file '{self.input_jsonl}' not found.")
             exit(1)
@@ -105,7 +108,7 @@ def convert_to_xml(self, puzzle):
         return "\n".join(rows)
 
     def convert(self, format_choice):
-        """Convert puzzles to the selected format."""
+        """Convert puzzles to the selected format, include game_rule and directly use config."""
         puzzles = self.load_puzzles()
         converted_puzzles = []
 
@@ -132,11 +135,21 @@ def convert(self, format_choice):
         description, format_function = format_methods[format_choice]
 
         # Apply the selected format method to each puzzle
-        for puzzle in puzzles:
+        for puzzle_data in puzzles:
+            puzzle = puzzle_data["puzzle"]
+            config = puzzle_data["config"]  # Directly use the "config" from the original data
+
+            # Add game rule based on grid size
+            grid_size = config["grid_size"]
+            game_rule = SudokuConfig.get_configs().get(f"{grid_size}x{grid_size}", {}).get("rules", "Unknown rules").strip()
+
+            # Build the converted puzzle data
             converted_puzzles.append({
-                "original_puzzle": puzzle,  # Include the original puzzle for reference
+                "original_puzzle": puzzle,  # Include the original puzzle
                 "converted_puzzle": format_function(puzzle),  # Converted puzzle
-                "format": description  # Metadata: format name
+                "format": description,  # Metadata: format name
+                "game_rule": game_rule,  # Game rule
+                "config": config  # Directly include the original config
             })
 
         # Save all converted puzzles in JSONL format