mail@pastecode.io avatarunknown
12 days ago
2.1 kB
import pandas as pd

# Define your primary query
primary_query = f"SELECT * FROM {schema_ppm}.etl_ppm_replication_master WHERE eprm_catalog='SC' AND eprm_enabled_flg='Y'"

# Execute the primary query and get the primary dataframe
primary_df = pd.read_sql(primary_query, con=connection_ppm)

# Iterate through the primary dataframe
for index, row in primary_df.iterrows():
    # Get the table name from the 'eprm_table_name' column
    table_name = row['eprm_table_name']
    # Create source and target queries
    source_query = f"SELECT * FROM {schema_source}.{table_name}"
    target_query = f"SELECT * FROM {schema_ext}.{table_name}"
    # Execute source and target queries to get dataframes
    source_df = pd.read_sql(source_query, connection_source)
    target_df = pd.read_sql(target_query, connection_ext)
    # Merge dataframes to find differences
    merged_df = source_df.merge(target_df, on=row['eprm_table_col_pk'], how='outer', suffixes=('_source', '_target'), indicator=True)
    # Filter for rows with differences
    differences = merged_df[merged_df['_merge'] != 'both'].drop('_merge', axis=1)
    # Iterate through the differences
    for index, diff_row in differences.iterrows():
        # Construct the dynamic update statement
        update_columns = []
        for column_name, (source_val, target_val) in diff_row.items():
            if source_val != target_val:
                update_columns.append(f"{column_name}_target = '{source_val}'")
        # Get the primary key and its value
        pk_column_name = row['eprm_table_col_pk']
        pk_value = diff_row[pk_column_name + '_source']
        # Construct the WHERE condition
        where_condition = f"WHERE {pk_column_name} = '{pk_value}'"
        # Construct the dynamic update query
        update_query = f"UPDATE {schema_ext}.{table_name} SET {', '.join(update_columns)} {where_condition}"
        # Execute the update query to update the differing record in the target
        # Be sure to execute this query using your database connection

# End of loop