gas_groupby, electricity_groupby join

ewillwin·2022년 7월 28일
0

TSMtech Record

목록 보기
16/39
import chunk
from typing import final
from venv import create
import pandas as pd
from sqlalchemy import create_engine
import warnings
#-*- coding: cp949 -*-

# Join the per-(date, addr) electricity and gas aggregates into one table and
# append the result to buildingenergy.csv.

Chunksize = 1000000  # not referenced by any statement in this script section
warnings.simplefilter(action='ignore', category=FutureWarning)

# Gas aggregate. The file's own header row is discarded (header=0) and replaced
# by the column names given in `names`.
gas = pd.read_csv("C:/Users/TSM/gas_groupby.csv",sep =',',encoding='utf-8',names=['date','addr','gas','count'],header=0,low_memory=False)
# Explicit 64-bit width instead of 'int', whose size follows the platform default.
gas = gas.astype({'date':'str','addr':'str','gas':'int64','count':'int64'})
gas = gas.sort_values(by=['date','addr'])
# Drop the gas-side 'count' so the merged frame carries only the electricity
# 'count' and the merge does not produce count_x / count_y columns.
gas = gas.drop(columns=['count'])

# Electricity aggregate, loaded the same way; its 'count' column is kept.
electricity = pd.read_csv("C:/Users/TSM/electricity_groupby.csv",sep =',',encoding='utf-8',names=['date','addr','electricity','count'],header=0,low_memory=False)
electricity = electricity.astype({'date':'str','addr':'str','electricity':'int64','count':'int64'})
electricity = electricity.sort_values(by=['date','addr'])

# Left join: every electricity row is kept; rows with no matching gas record
# get a missing value in 'gas'.
df = pd.merge(left=electricity, right=gas, how='left', on=['date','addr'])
df = df[['date','addr','electricity','gas','count']]
# A missing value cannot be stored in a plain int column, so the merge turns
# 'gas' into float. The nullable 'Int64' dtype keeps the values as integers and
# represents the unmatched rows as <NA>, which to_csv writes as an empty field.
# No errors='ignore' here: a failed cast should surface, not be silently skipped.
df = df.astype({'date':'str','addr':'str','electricity':'int64','gas':'Int64','count':'int64'})
print(df)
# Appends without a header row; re-running the script adds the rows again.
df.to_csv("buildingenergy.csv", mode='a', index=False, header=False)
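  • left join 시 electricity 행에 매칭되는 gas 행이 없으면 gas 값이 NaN이 되고, NaN은 일반 int type에 담을 수 없기 때문에 gas 소비량 컬럼이 float type으로 처리됨 (정수로 유지하려면 pandas의 nullable 정수 dtype인 'Int64'를 사용)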
profile
Software Engineer @ LG Electronics

0개의 댓글