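pypaimon CLI: print `table get` schema as JSON and accept the same JSON format in `table create --schema`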

JingsongLi · JingsongLi · commit 3959a60bd3a1 · 2026-03-08T09:52:37.000+08:00
diff --git a/docs/content/pypaimon/cli.md b/docs/content/pypaimon/cli.md
@@ -127,7 +127,7 @@ Output:
 
 ### Table Get
 
-Get and display detailed schema information about a Paimon table.
+Get and display a table's schema in JSON format. The output uses the same schema JSON format that `table create` accepts, making it easy to export and reuse table schemas.
 
 ```shell
 paimon table get DATABASE.TABLE
@@ -140,107 +140,67 @@ paimon table get mydb.users
 ```
 
 Output:
+```json
+{
+  "fields": [
+    {"id": 0, "name": "user_id", "type": "BIGINT"},
+    {"id": 1, "name": "username", "type": "STRING"},
+    {"id": 2, "name": "email", "type": "STRING"},
+    {"id": 3, "name": "age", "type": "INT"},
+    {"id": 4, "name": "city", "type": "STRING"},
+    {"id": 5, "name": "created_at", "type": "TIMESTAMP"},
+    {"id": 6, "name": "is_active", "type": "BOOLEAN"}
+  ],
+  "partitionKeys": ["city"],
+  "primaryKeys": ["user_id"],
+  "options": {
+    "bucket": "4",
+    "changelog-producer": "input"
+  },
+  "comment": "User information table"
+}
 ```
-================================================================================
-Table: mydb.users
-================================================================================
-
-Schema ID: 0
-
-Comment: User information table
 
-================================================================================
-Fields:
-================================================================================
-ID    Name              Type                 Nullable   Description
------ ------------------ -------------------- --------- --------------------------
-0     user_id           BIGINT               YES        
-1     username          STRING               YES        
-2     email             STRING               YES        
-3     age               INT                  YES        
-4     city              STRING               YES        
-5     created_at        TIMESTAMP(6)         YES        
-6     is_active         BOOLEAN              YES        
-
-================================================================================
-Partition Keys: city
-
-================================================================================
-Primary Keys: user_id
-
-================================================================================
-Table Options:
-================================================================================
-  bucket                                   = 4
-  changelog-producer                       = input
-```
+**Note:** The output JSON can be saved to a file and used directly with the `table create` command to recreate the table structure.
 
 ### Table Create
 
-Create a new Paimon table with a schema defined in a JSON or YAML file.
+Create a new Paimon table with a schema defined in a JSON file. The schema JSON format is the same as the output from `table get`, ensuring consistency and easy schema reuse.
 
 ```shell
-paimon table create DATABASE.TABLE --schema-file SCHEMA_FILE
+paimon table create DATABASE.TABLE --schema SCHEMA_FILE
 ```
 
 **Options:**
 
-- `--schema-file, -s`: Path to schema definition file (JSON or YAML) - **Required**
+- `--schema, -s`: Path to schema JSON file - **Required**
 - `--ignore-if-exists, -i`: Do not raise error if table already exists
 
-The schema file should be a JSON or YAML file with the following structure:
+The schema JSON file uses the same format as the output of `table get`. It supports the following properties:
 
-**JSON Example (`schema.json`):**
+**Field Properties:**
 
-```json
-{
-  "fields": [
-    {"name": "user_id", "type": "BIGINT"},
-    {"name": "username", "type": "STRING"},
-    {"name": "email", "type": "STRING"},
-    {"name": "age", "type": "INT"},
-    {"name": "city", "type": "STRING"},
-    {"name": "created_at", "type": "TIMESTAMP"},
-    {"name": "is_active", "type": "BOOLEAN"}
-  ],
-  "partition_keys": ["city"],
-  "primary_keys": ["user_id"],
-  "options": {
-    "bucket": "4",
-    "changelog-producer": "input"
-  },
-  "comment": "User information table"
-}
-```
+- `id`: Field ID (integer, typically starting from 0) - **Required**
+- `name`: Field name - **Required**
+- `type`: Field data type (e.g., `INT`, `BIGINT`, `STRING`, `TIMESTAMP`, `DECIMAL(10,2)`) - **Required**
+- `description`: Optional field description
 
-**YAML Example (`schema.yaml`):**
+**Schema Properties:**
 
-```yaml
-fields:
-  - name: user_id
-    type: BIGINT
-  - name: username
-    type: STRING
-  - name: email
-    type: STRING
-  - name: age
-    type: INT
-  - name: city
-    type: STRING
-  - name: created_at
-    type: TIMESTAMP
-  - name: is_active
-    type: BOOLEAN
-
-partition_keys:
-  - city
-
-primary_keys:
-  - user_id
-
-options:
-  bucket: "4"
-  changelog-producer: input
-
-comment: User information table
-```
+- `fields`: List of field definitions - **Required**
+- `partitionKeys`: List of partition key column names
+- `primaryKeys`: List of primary key column names
+- `options`: Table options as key-value pairs
+- `comment`: Table comment
+
+**Example Workflow:**
+
+1. Export schema from an existing table:
+   ```shell
+   paimon table get mydb.users > users_schema.json
+   ```
+
+2. Create a new table with the same schema:
+   ```shell
+   paimon table create mydb.users_copy --schema users_schema.json
+   ```
diff --git a/paimon-python/pypaimon/cli/cli_table.py b/paimon-python/pypaimon/cli/cli_table.py
@@ -22,6 +22,7 @@
 """
 
 import sys
+from pypaimon.common.json_util import JSON
 
 
 def cmd_table_read(args):
@@ -85,7 +86,7 @@ def cmd_table_get(args):
     """
     Execute the 'table get' command.
     
-    Gets and displays table schema information.
+    Gets and displays table schema information in JSON format.
     
     Args:
         args: Parsed command line arguments.
@@ -116,52 +117,9 @@ def cmd_table_get(args):
         print(f"Error: Failed to get table '{table_identifier}': {e}", file=sys.stderr)
         sys.exit(1)
     
-    # Get table schema
-    schema = table.table_schema
-    
-    # Display table information
-    print("=" * 80)
-    print(f"Table: {database_name}.{table_name}")
-    print("=" * 80)
-    
-    # Display schema ID
-    print(f"\nSchema ID: {schema.id}")
-    
-    # Display comment if exists
-    if schema.comment:
-        print(f"\nComment: {schema.comment}")
-    
-    # Display fields
-    print(f"\n{'='*80}")
-    print("Fields:")
-    print(f"{'='*80}")
-    print(f"{'ID':<5} {'Name':<18} {'Type':<20} {'Nullable':<9} {'Description'}")
-    print(f"{'-'*5} {'-'*18} {'-'*20} {'-'*9} {'-'*26}")
-    
-    for field in schema.fields:
-        nullable = "YES" if field.type.nullable else "NO"
-        description = field.description or ""
-        print(f"{field.id:<5} {field.name:<18} {str(field.type):<20} {nullable:<9} {description}")
-    
-    # Display partition keys
-    if schema.partition_keys:
-        print(f"\n{'='*80}")
-        print(f"Partition Keys: {', '.join(schema.partition_keys)}")
-    
-    # Display primary keys
-    if schema.primary_keys:
-        print(f"\n{'='*80}")
-        print(f"Primary Keys: {', '.join(schema.primary_keys)}")
-    
-    # Display options
-    if schema.options:
-        print(f"\n{'='*80}")
-        print("Table Options:")
-        print(f"{'='*80}")
-        for key, value in sorted(schema.options.items()):
-            print(f"  {key:<40} = {value}")
-    
-    print(f"\n{'='*80}\n")
+    # Get table schema and convert to Schema, then output as JSON
+    schema = table.table_schema.to_schema()
+    print(JSON.to_json(schema, indent=2))
 
 
 def cmd_table_create(args):
@@ -174,7 +132,6 @@ def cmd_table_create(args):
         args: Parsed command line arguments.
     """
     import json
-    import yaml
     from pypaimon.cli.cli import load_catalog_config, create_catalog
     from pypaimon import Schema
     
@@ -195,72 +152,29 @@ def cmd_table_create(args):
     
     database_name, table_name = parts
     
-    # Load schema from file
-    schema_file = args.schema_file
+    # Load schema from JSON file
+    schema_file = args.schema
     if not schema_file:
-        print("Error: Schema file is required. Use --schema-file option.", file=sys.stderr)
+        print("Error: Schema is required. Use --schema option.", file=sys.stderr)
         sys.exit(1)
     
     try:
         with open(schema_file, 'r', encoding='utf-8') as f:
-            if schema_file.endswith('.json'):
-                schema_def = json.load(f)
-            elif schema_file.endswith('.yaml') or schema_file.endswith('.yml'):
-                schema_def = yaml.safe_load(f)
-            else:
-                print("Error: Unsupported schema file format. Use .json, .yaml, or .yml", file=sys.stderr)
-                sys.exit(1)
+            schema_json = f.read()
+        paimon_schema = JSON.from_json(schema_json, Schema)
+        
     except FileNotFoundError:
         print(f"Error: Schema file not found: {schema_file}", file=sys.stderr)
         sys.exit(1)
+    except json.JSONDecodeError as e:
+        print(f"Error: Invalid JSON format in schema file: {e}", file=sys.stderr)
+        sys.exit(1)
     except Exception as e:
-        print(f"Error: Failed to read schema file: {e}", file=sys.stderr)
+        print(f"Error: Failed to parse schema: {e}", file=sys.stderr)
         sys.exit(1)
     
-    # Parse schema definition
+    # Create table
     try:
-        # Validate required fields
-        if 'fields' not in schema_def:
-            print("Error: Schema must contain 'fields' section", file=sys.stderr)
-            sys.exit(1)
-        
-        # Build PyArrow schema from definition
-        import pyarrow as pa
-        pa_fields = []
-        for field in schema_def['fields']:
-            field_name = field.get('name')
-            field_type = field.get('type')
-            
-            if not field_name or not field_type:
-                print("Error: Each field must have 'name' and 'type'", file=sys.stderr)
-                sys.exit(1)
-            
-            # Convert type string to PyArrow type
-            from pypaimon.schema.data_types import DataTypeParser, PyarrowFieldParser
-
-            # Parse type string to Paimon DataType, then convert to PyArrow type
-            paimon_type = DataTypeParser.parse_data_type(field_type)
-            pa_type = PyarrowFieldParser.from_paimon_type(paimon_type)
-            pa_fields.append(pa.field(field_name, pa_type))
-        
-        pa_schema = pa.schema(pa_fields)
-        
-        # Extract optional parameters
-        partition_keys = schema_def.get('partition_keys', [])
-        primary_keys = schema_def.get('primary_keys', [])
-        options = schema_def.get('options', {})
-        comment = schema_def.get('comment')
-        
-        # Create Paimon schema
-        paimon_schema = Schema.from_pyarrow_schema(
-            pa_schema,
-            partition_keys=partition_keys if partition_keys else None,
-            primary_keys=primary_keys if primary_keys else None,
-            options=options if options else None,
-            comment=comment
-        )
-        
-        # Create table
         ignore_if_exists = args.ignore_if_exists
         catalog.create_table(f"{database_name}.{table_name}", paimon_schema, ignore_if_exists)
         
@@ -309,9 +223,9 @@ def add_table_subcommands(table_parser):
         help='Table identifier in format: database.table'
     )
     create_parser.add_argument(
-        '--schema-file', '-s',
+        '--schema', '-s',
         required=True,
-        help='Path to schema definition file (JSON or YAML)'
+        help='Path to schema JSON file'
     )
     create_parser.add_argument(
         '--ignore-if-exists', '-i',
diff --git a/paimon-python/pypaimon/tests/cli_test.py b/paimon-python/pypaimon/tests/cli_test.py