@@ -194,6 +194,7 @@ def sanitize_dataframe_columns_names(
194
194
How to handle duplicate columns. Can be "warn" or "drop" or "rename".
195
195
The default is "warn". "drop" will drop all but the first duplicated column.
196
196
"rename" will rename all duplicated columns with an incremental number.
197
+
197
198
Returns
198
199
-------
199
200
pandas.DataFrame
@@ -202,13 +203,18 @@ def sanitize_dataframe_columns_names(
202
203
Examples
203
204
--------
204
205
>>> import awswrangler as wr
205
- >>> df_normalized = wr.catalog.sanitize_dataframe_columns_names(df=pd.DataFrame({'A': [1, 2]}))
206
- >>> df_normalized_drop = wr.catalog.sanitize_dataframe_columns_names(df=pd.DataFrame({'A': [1, 2], 'a': [3, 4]}), handle_duplicate_columns="drop")
207
- >>> df_normalized_rename = wr.catalog.sanitize_dataframe_columns_names(df=pd.DataFrame({'A': [1, 2], 'a': [3, 4], 'a_1': [4, 6]}), handle_duplicate_columns="rename")
206
+ >>> df_normalized = wr.catalog.sanitize_dataframe_columns_names(df=pd.DataFrame({"A": [1, 2]}))
207
+ >>> df_normalized_drop = wr.catalog.sanitize_dataframe_columns_names(
208
+ df=pd.DataFrame({"A": [1, 2], "a": [3, 4]}), handle_duplicate_columns="drop"
209
+ )
210
+ >>> df_normalized_rename = wr.catalog.sanitize_dataframe_columns_names(
211
+ df=pd.DataFrame({"A": [1, 2], "a": [3, 4], "a_1": [4, 6]}), handle_duplicate_columns="rename"
212
+ )
213
+
208
214
"""
209
215
df .columns = [sanitize_column_name (x ) for x in df .columns ]
210
216
df .index .names = [None if x is None else sanitize_column_name (x ) for x in df .index .names ]
211
- if len (set (df .columns )) != len (df .columns ): # df.columns.duplicated().any():
217
+ if len (set (df .columns )) != len (df .columns ):
212
218
if handle_duplicate_columns == "warn" :
213
219
warnings .warn (
214
220
"Some columns names are duplicated, consider using `handle_duplicate_columns='[drop|rename]'`" ,
0 commit comments