import csv
import json
import pandas as pd
# Default input CSV read by main() and the line-delimited JSON file it writes.
csv_filename = "tmdb_5000_movies.csv"
json_filename = "tmdb_5000_movies.json"
def _decode_cell(value):
    """Return the parsed value when *value* is a JSON array string, else *value* unchanged."""
    # Only string cells that look like a JSON array are candidates for parsing;
    # missing cells (None) and overflow cells (lists) pass straight through.
    if isinstance(value, str) and value.startswith('['):
        try:
            return json.loads(value)
        except json.JSONDecodeError:
            # Starts with '[' but is not valid JSON: keep the raw text.
            return value
    return value


def main(csv_path=None, json_path=None):
    """Convert a CSV file into a line-delimited JSON file.

    The first row of the CSV supplies the field names. Every following row is
    written as one JSON object per line. Cells whose text starts with ``[``
    and parses as JSON are replaced by the parsed value; cells that fail to
    parse are written unchanged as strings.

    Args:
        csv_path: Path of the CSV file to read. Defaults to the module-level
            ``csv_filename``.
        json_path: Path of the output file to write. Defaults to the
            module-level ``json_filename``.
    """
    if csv_path is None:
        csv_path = csv_filename
    if json_path is None:
        json_path = json_filename

    # newline='' is what the csv module expects so that line breaks embedded
    # in quoted fields are handled by the parser itself. The context manager
    # closes both files even if a row fails to serialize.
    with open(csv_path, 'r', encoding='UTF-8', newline='') as csvfile, \
            open(json_path, 'w', encoding='UTF-8') as jsonfile:
        # With no explicit fieldnames, DictReader consumes the header row
        # itself, so no manual "skip the first row" bookkeeping is needed.
        reader = csv.DictReader(csvfile)
        for row in reader:
            record = {key: _decode_cell(value) for key, value in row.items()}
            # ensure_ascii=False keeps non-ASCII text readable in the output.
            json.dump(record, jsonfile, ensure_ascii=False)
            jsonfile.write('\n')

    print("succees!")
# Run the conversion only when this file is executed as a script.
if __name__ == "__main__":
    main()
# Parse result: