excel 转 dbf

gaohaikuo1 · 发表于 2024-12-21 14:52:11

import pandas as pd
import dbf

def excel_to_dbf(input_excel_path, sheet_name, output_dbf_path):
"""
将 Excel 的指定工作表导出为 DBF 文件，保留数据类型和列名格式。

参数:
      input_excel_path (str): 输入的 Excel 文件路径。
      sheet_name (str): 需要读取的工作表名称。
      output_dbf_path (str): 导出的 DBF 文件路径。
"""
# 读取 Excel 的指定表
df = pd.read_excel(input_excel_path, sheet_name=sheet_name)

# 定义字段字符串列表，根据数据类型进行动态判断
def get_field_definition(column):
      if df[column].dtype == 'object':  # 字符类型
         return f"{column} C(255)"
      elif pd.api.types.is_integer_dtype(df[column]):  # 整型
         return f"{column} N(20,0)"  # 整型无需小数位，最大宽度20
      elif pd.api.types.is_float_dtype(df[column]):  # 浮点型
         # 判断小数位数
         max_decimal_places = df[column].apply(
            lambda x: len(str(x).split(".")[1]) if pd.notnull(x) and "." in str(x) else 0
         ).max()
         return f"{column} N(18,{min(max_decimal_places, 5)})"  # 浮点型设置小数位，限制最大5位
      elif pd.api.types.is_datetime64_any_dtype(df[column]):  # 日期类型
         return f"{column} D"
      else:
         raise ValueError(f"Unsupported column type for {column}")

# 生成字段定义，确保列名格式不变
field_definitions = ";".join([get_field_definition(col) for col in df.columns])
print(field_definitions)

# 使用指定编码创建 DBF 表
table = dbf.Table(output_dbf_path, field_definitions, codepage="cp936")
table.open(dbf.READ_WRITE)

		自动登录	找回密码
密码			立即注册

excel 转 dbf

浏览过的版块