[英]How to convert from csv to nested json dictionary ( A beginner )
我的結果:
[
{
"FIRST NAME": "JOHN",
"PRY SCHOOL": "OLIVETTE",
"HIGH SCHOOL": "BAPTIST",
"VEHICLEMAKE ": "TOYOTA",
"VEHICLE COL": "BLACK",
"TV MAKE": "SAMSUNG"
},
{
"FIRST NAME": "KOFI",
"PRY SCHOOL": "ACADAMY",
"HIGH SCHOOL": "MAYFLOWER",
"VEHICLEMAKE ": "HONDA",
"VEHICLE COL": "YELLOW",
"TV MAKE": "TECHWOOD"
},
{
"FIRST NAME": "BISI",
"PRY SCHOOL": "IGBOBI",
"HIGH SCHOOL": "ANGUS",
"VEHICLEMAKE ": "HYUNDAI",
"VEHICLE COL": "BLUE",
"TV MAKE": "THERMOC"
}
]
預期結果:
[
{
"FIRST NAME": "JOHN",
"SCHOOL": {
"primary": "OLIVETTE",
"HIGH SCHOOL": "BAPTIST"
},
"VEHICLE": {
"MAKE": "TOYOTA",
"COL": "BLACK"
},
"TV MAKE": "SAMSUNG"
},
{
"FIRST NAME": "KOFI",
"SCHOOL": {
"primary": "ACADAMY",
"HIGH SCHOOL": "MAYFLOWER"
},
"VEHICLE": {
"MAKE": "HONDA",
"COL": "YELLOW"
},
"TV MAKE": "TECHWOOD"
},
{
"FIRST NAME": "BISI",
"SCHOOL": {
"primary": "IGBOBI",
"HIGH SCHOOL": "ANGUS"
},
"VEHICLE": {
"MAKE": "HYUNDAI",
"COL": "BLUE"
},
"TV MAKE": "THERMO"
}
]
我的代碼:
import csv
import json
filenames = 'csvfilepath.csv'
my_dic = []
with open(filenames, encoding='utf-8') as csv_file:
csv_reader = csv.DictReader(csv_file)
for row in csv_reader:
my_dic.append(row)
with open('jasonfilepath.json', 'w', encoding='utf-8') as file_object:
json.dump(my_dic, file_object ,indent = 4)
我的數據:
firstname PRY SCHOOL HIGH SCHOOL VEHICLEMAKE VEHICLECOL TVMAKE
JOHN OLIVETTE BAPTIST TOYOTA BLACK SAMSUNG
KOFI ACADAMY MAYFLOWER HONDA YELLOW TECHWOOD
BISI IGBOBI ANGUS HYUNDAI BLUE THERMO
注意:行數超過 1000 行
我想確保學校(包括小學和中學)和車輛(品牌和顏色)的嵌套結構
DictReader
無法讀取嵌套數據,您需要手動構建具有所需結構的字典。 對於這種情況,我將使用簡單的csv.reader
。
代碼:
import csv
import json
with open(r"csvfilepath.csv", newline="") as inp_f, \
open(r"jsonfilepath.json", "w") as out_f:
reader = csv.reader(inp_f, delimiter="\t")
next(reader) # skip header
my_dic = []
for row in reader:
if len(row) >= 6: # skip rows which missing columns
my_dic.append({
"FIRST NAME": row[0],
"SCHOOL": {
"primary": row[1],
"HIGH SCHOOL": row[2]
},
"VEHICLE": {
"MAKE": row[3],
"COL": row[4]
},
"TV MAKE": row[5]
})
if my_dic: # if my_dic is not empty
json.dump(my_dic, out_f, indent=4)
類似於下面的內容(您確定“TV MAKE”位置嗎?)
data = [ { "FIRST NAME": "JOHN", "PRY SCHOOL": "OLIVETTE", "HIGH SCHOOL": "BAPTIST", "VEHICLEMAKE ": "TOYOTA", "VEHICLE COL": "BLACK", "TV MAKE": "SAMSUNG" }, { "FIRST NAME": "KOFI", "PRY SCHOOL": "ACADAMY", "HIGH SCHOOL": "MAYFLOWER", "VEHICLEMAKE ": "HONDA", "VEHICLE COL": "YELLOW", "TV MAKE": "TECHWOOD" }, { "FIRST NAME": "BISI", "PRY SCHOOL": "IGBOBI", "HIGH SCHOOL": "ANGUS", "VEHICLEMAKE ": "HYUNDAI", "VEHICLE COL": "BLUE", "TV MAKE": "THERMOC" } ]
new = [{'SCHOOL':{'PRIMARY':d['PRY SCHOOL'],'HIGH SCHOOL':d['HIGH SCHOOL']},'VEHICLE':{'MAKE':d['VEHICLEMAKE '],'COL':d['VEHICLE COL']},'FIRST NAME':d['FIRST NAME'],'TV MAKE':d['TV MAKE']} for d in data]
print(new)
輸出
[{'SCHOOL': {'PRIMARY': 'OLIVETTE', 'HIGH SCHOOL': 'BAPTIST'}, 'VEHICLE': {'MAKE': 'TOYOTA', 'COL': 'BLACK'}, 'FIRST NAME': 'JOHN', 'TV MAKE': 'SAMSUNG'}, {'SCHOOL': {'PRIMARY': 'ACADAMY', 'HIGH SCHOOL': 'MAYFLOWER'}, 'VEHICLE': {'MAKE': 'HONDA', 'COL': 'YELLOW'}, 'FIRST NAME': 'KOFI', 'TV MAKE': 'TECHWOOD'}, {'SCHOOL': {'PRIMARY': 'IGBOBI', 'HIGH SCHOOL': 'ANGUS'}, 'VEHICLE': {'MAKE': 'HYUNDAI', 'COL': 'BLUE'}, 'FIRST NAME': 'BISI', 'TV MAKE': 'THERMOC'}]
假設使用制表符分隔的輸入文件,您可以在讀取輸入文件時通過稍微修改邏輯來構建嵌套:
with open(filenames, encoding='utf-8') as csv_file:
csv_reader = csv.DictReader(csv_file, delimiter="\t")
for row in csv_reader:
my_dic.append({"FIRST NAME": row['firstname'],
"SCHOOL" : { "PRIMARY": row['PRY SCHOOL'],
"HIGH SCHOOL" : row['HIGH SCHOOL']},
"VEHICLE" : { "MAKE": row['VEHICLEMAKE'],
"COL": row['VEHICLECOL']},
"TV MAKE" : row["TVMAKE"]})
聲明:本站的技術帖子網頁,遵循CC BY-SA 4.0協議,如果您需要轉載,請注明本站網址或者原文地址。任何問題請咨詢:yoyou2525@163.com.