数据清洗与格式转换全能工具，让脏数据变干净、杂格式变统一。
python3 scripts/data_ops.py convert data.csv --to json -o data.json
python3 scripts/data_ops.py convert data.xlsx --to csv -o data.csv
python3 scripts/data_ops.py convert data.json --to yaml -o data.yaml
python3 scripts/data_ops.py fix-encoding data.csv --target-encoding utf-8 -o fixed.csv
python3 scripts/data_ops.py clean data.csv --dedup --trim --fill-na "N/A" --normalize-space -o cleaned.csv
python3 scripts/data_ops.py regex data.csv --column "备注" --pattern "手机号: (\d{11})" --extract -o phones.csv
python3 scripts/data_ops.py rename-cols data.csv --mapping '{"姓名": "name", "年龄": "age"}' -o renamed.csv
python3 scripts/data_ops.py validate data.csv --column "邮箱" --type email --report validation.json
python3 scripts/data_ops.py batch-convert ./data_dir/ --from csv --to json --output-dir ./json_output/
pip install pandas openpyxl pyyaml chardet
共 1 个版本