#!/usr/bin/python
# -*- coding:utf-8 -*-
import json
import pandas as pd
import os
def file_name(file_path):
    """Collect the path of every file found under a directory tree.

    The tree is traversed with ``os.walk``. For each directory visited,
    ``root`` is that directory's path, ``dirs`` lists its subdirectories
    and ``files`` lists its non-directory entries; only ``files`` is used.

    :param file_path: directory at which the walk starts.
    :return: list of paths, each formed by joining the containing
        directory with the file name, in the order ``os.walk`` yields them.
        The list is empty when the walk yields no files.
    """
    return [
        os.path.join(root, name)
        for root, _dirs, files in os.walk(file_path)
        for name in files
    ]
def json_out(file_path, out_path=r"D:\rzj\newYelp\yelp_academic_dataset_user.xlsx"):
    """Convert a JSON-lines file into an xlsx workbook.

    Each non-blank line of the input is parsed as one JSON document; the
    parsed records become the rows of a ``pandas.DataFrame`` which is then
    written with ``DataFrame.to_excel`` (without the index column).

    :param file_path: path of the UTF-8 encoded input file, one JSON
        document per line.
    :param out_path: path of the xlsx file to write. Defaults to the
        location this script originally wrote to.
    :return: None
    :raises json.JSONDecodeError: if a non-blank line is not valid JSON.
    """
    records = []
    # The context manager guarantees the handle is closed even when a line
    # fails to parse.
    with open(file_path, "r", encoding="utf-8") as source:
        # Iterate lazily instead of readlines() so the raw text of the whole
        # file is not held in memory alongside the parsed records.
        for line in source:
            line = line.strip()
            if not line:
                # Blank lines (e.g. a trailing newline) carry no record.
                continue
            records.append(json.loads(line))
    pd.DataFrame(records).to_excel(out_path, index=False)
if __name__ == '__main__':
    import sys

    # Script entry point: convert one JSON-lines file to xlsx.
    # The input path may be given as the first command-line argument;
    # otherwise the original hard-coded location is used.
    if len(sys.argv) > 1:
        file_path = sys.argv[1]
    else:
        file_path = r"C:\Users\Desktop\yelp_dataset\yelp_academic_dataset_user.json"
    json_out(file_path)
# 参考资料: