1- from .utilities import create_file_object , df_generator , logger , cast_pandas
2- from ._base_copy import BaseCopy
31import pandas as pd
2+ from .utilities import create_file_object , df_generator , cast_pandas
3+ from ._base_copy import BaseCopy
44
55
66class HDFTableCopy (BaseCopy ):
@@ -90,33 +90,35 @@ def hdf_to_pg(self, data_formatters=[cast_pandas], data_formatter_kwargs={}):
9090 data_formatter_kwargs: list of kwargs to pass to data_formatters functions
9191 """
9292 if self .hdf_tables is None :
93- logger .warn ("No HDF table found for SQL table {}" .format (self .sql_table ))
93+ self .logger .warn (
94+ "No HDF table found for SQL table {}" .format (self .sql_table )
95+ )
9496 return
9597
9698 for hdf_table in self .hdf_tables :
97- logger .info ("*** {} ***" .format (hdf_table ))
99+ self . logger .info ("*** {} ***" .format (hdf_table ))
98100
99- logger .info ("Reading HDF table" )
101+ self . logger .info ("Reading HDF table" )
100102 df = pd .read_hdf (self .file_name , key = hdf_table )
101103 self .rows += len (df )
102104
103105 data_formatter_kwargs ["hdf_table" ] = hdf_table
104- logger .info ("Formatting data" )
106+ self . logger .info ("Formatting data" )
105107 df = self .data_formatting (
106108 df , functions = data_formatters , ** data_formatter_kwargs
107109 )
108110
109- logger .info ("Creating generator for chunking dataframe" )
110- for chunk in df_generator (df , self .csv_chunksize ):
111+ self . logger .info ("Creating generator for chunking dataframe" )
112+ for chunk in df_generator (df , self .csv_chunksize , logger = self . logger ):
111113
112- logger .info ("Creating CSV in memory" )
114+ self . logger .info ("Creating CSV in memory" )
113115 fo = create_file_object (chunk )
114116
115- logger .info ("Copying chunk to database" )
117+ self . logger .info ("Copying chunk to database" )
116118 self .copy_from_file (fo )
117119 del fo
118120 del df
119- logger .info ("All chunks copied ({} rows)" .format (self .rows ))
121+ self . logger .info ("All chunks copied ({} rows)" .format (self .rows ))
120122
121123
122124class SmallHDFTableCopy (HDFTableCopy ):
@@ -136,29 +138,29 @@ def hdf_to_pg(self, data_formatters=[cast_pandas], data_formatter_kwargs={}):
136138 data_formatter_kwargs: list of kwargs to pass to data_formatters functions
137139 """
138140 if self .hdf_tables is None :
139- logger .warn ("No HDF table found for SQL table {self.sql_table}" )
141+ self . logger .warn ("No HDF table found for SQL table {}" .format (self .sql_table ))
140142 return
141143
142144 for hdf_table in self .hdf_tables :
143- logger .info ("*** {} ***" .format (hdf_table ))
144- logger .info ("Reading HDF table" )
145+ self . logger .info ("*** {} ***" .format (hdf_table ))
146+ self . logger .info ("Reading HDF table" )
145147 df = pd .read_hdf (self .file_name , key = hdf_table )
146148 self .rows += len (df )
147149
148150 data_formatter_kwargs ["hdf_table" ] = hdf_table
149- logger .info ("Formatting data" )
151+ self . logger .info ("Formatting data" )
150152 df = self .data_formatting (
151153 df , functions = data_formatters , ** data_formatter_kwargs
152154 )
153155
154- logger .info ("Creating CSV in memory" )
156+ self . logger .info ("Creating CSV in memory" )
155157 fo = create_file_object (df )
156158
157- logger .info ("Copying table to database" )
159+ self . logger .info ("Copying table to database" )
158160 self .copy_from_file (fo )
159161 del df
160162 del fo
161- logger .info ("All chunks copied ({} rows)" .format (self .rows ))
163+ self . logger .info ("All chunks copied ({} rows)" .format (self .rows ))
162164
163165
164166class BigHDFTableCopy (HDFTableCopy ):
@@ -181,11 +183,13 @@ def hdf_to_pg(self, data_formatters=[cast_pandas], data_formatter_kwargs={}):
181183 data_formatter_kwargs: list of kwargs to pass to data_formatters functions
182184 """
183185 if self .hdf_tables is None :
184- logger .warn ("No HDF table found for SQL table {}" .format (self .sql_table ))
186+ self .logger .warn (
187+ "No HDF table found for SQL table {}" .format (self .sql_table )
188+ )
185189 return
186190
187191 for hdf_table in self .hdf_tables :
188- logger .info ("*** {} ***" .format (hdf_table ))
192+ self . logger .info ("*** {} ***" .format (hdf_table ))
189193
190194 with pd .HDFStore (self .file_name ) as store :
191195 nrows = store .get_storer (hdf_table ).nrows
@@ -199,26 +203,28 @@ def hdf_to_pg(self, data_formatters=[cast_pandas], data_formatter_kwargs={}):
199203 start = 0
200204
201205 for i in range (n_chunks ):
202- logger .info ("*** HDF chunk {i} of {n} ***" .format (i = i + 1 , n = n_chunks ))
203- logger .info ("Reading HDF table" )
206+ self .logger .info (
207+ "*** HDF chunk {i} of {n} ***" .format (i = i + 1 , n = n_chunks )
208+ )
209+ self .logger .info ("Reading HDF table" )
204210 stop = min (start + self .hdf_chunksize , nrows )
205211 df = pd .read_hdf (self .file_name , key = hdf_table , start = start , stop = stop )
206212
207213 start += self .hdf_chunksize
208214
209215 data_formatter_kwargs ["hdf_table" ] = hdf_table
210- logger .info ("Formatting data" )
216+ self . logger .info ("Formatting data" )
211217 df = self .data_formatting (
212218 df , functions = data_formatters , ** data_formatter_kwargs
213219 )
214220
215- logger .info ("Creating generator for chunking dataframe" )
216- for chunk in df_generator (df , self .csv_chunksize ):
217- logger .info ("Creating CSV in memory" )
221+ self . logger .info ("Creating generator for chunking dataframe" )
222+ for chunk in df_generator (df , self .csv_chunksize , logger = self . logger ):
223+ self . logger .info ("Creating CSV in memory" )
218224 fo = create_file_object (chunk )
219225
220- logger .info ("Copying chunk to database" )
226+ self . logger .info ("Copying chunk to database" )
221227 self .copy_from_file (fo )
222228 del fo
223229 del df
224- logger .info ("All chunks copied ({} rows)" .format (self .rows ))
230+ self . logger .info ("All chunks copied ({} rows)" .format (self .rows ))
0 commit comments