Ma'lumotlar tahlilida turli fayl formatlari bilan ishlash muhim ko'nikma.
CSV fayllar
import pandas as pd
# Load the CSV file into a DataFrame, decoding it as UTF-8.
df = pd.read_csv("data.csv", encoding="utf-8")
# Save the DataFrame as CSV without the index column, encoded as UTF-8.
df.to_csv("natija.csv", encoding="utf-8", index=False)
# Re-read the same file, this time treating ';' as the field separator.
df = pd.read_csv("data.csv", sep=";")
Excel fayllar
pip install openpyxl
# Read the worksheet named 'Sheet1' from an Excel workbook.
df = pd.read_excel('data.xlsx', sheet_name='Sheet1')
# Write the DataFrame to a worksheet named 'Natija', omitting the index.
df.to_excel('natija.xlsx', index=False, sheet_name='Natija')
# Multiple sheets in one workbook: each to_excel call must sit inside the
# `with` body so it runs while the writer is still open.
# NOTE: df1 and df2 are not defined in this snippet; they stand for
# DataFrames prepared elsewhere.
with pd.ExcelWriter('hisobot.xlsx') as writer:
    df1.to_excel(writer, sheet_name='Oy1')
    df2.to_excel(writer, sheet_name='Oy2')
JSON fayllar
import json
# Read: parse the JSON file into Python objects.
with open('data.json', 'r', encoding='utf-8') as f:
    data = json.load(f)
# Write: ensure_ascii=False keeps non-ASCII characters as-is instead of
# \uXXXX escapes; indent=2 pretty-prints the output.
with open('natija.json', 'w', encoding='utf-8') as f:
    json.dump(data, f, ensure_ascii=False, indent=2)
# With pandas: load JSON straight into a DataFrame, then write it back as a
# list of row records. Note this overwrites the 'natija.json' written above.
df = pd.read_json('data.json')
df.to_json('natija.json', orient='records', force_ascii=False)
Bir nechta CSV ni birlashtirish
import glob
# Collect every CSV under data/. glob.glob returns paths in a
# filesystem-dependent order, so sort them to make the row order of the
# merged DataFrame reproducible between runs and machines.
fayllar = sorted(glob.glob('data/*.csv'))
# Load each file into its own DataFrame.
df_list = [pd.read_csv(path) for path in fayllar]
# Stack the frames vertically; ignore_index=True renumbers rows 0..n-1.
# NOTE: pd.concat raises ValueError if no files matched (empty list).
df = pd.concat(df_list, ignore_index=True)