|
-- Assumes that materialize_mig_view.sql has already been executed.
-- This view allows comparing two MIG versions to find added, deleted, and modified rows.
--
-- IMPORTANT: This view contains the diff for every (older version, newer version) pair of each format,
-- i.e. a cross-product of all version pairs. You MUST filter by version and format.
--
-- Usage for comparing FV2410 -> FV2504 for UTILTS format:
--   SELECT * FROM v_mig_diff
--   WHERE old_format_version = 'FV2410'
--     AND old_format = 'UTILTS'
--     AND new_format_version = 'FV2504'
--     AND new_format = 'UTILTS'
--   ORDER BY sort_path;
--
-- diff_status can be: 'added', 'deleted', 'modified', 'unchanged'
-- The view compares line_status_std, line_status_specification, and line_name to determine modifications.
--
-- For deleted rows, old_ columns are populated and new_ columns are NULL
-- (except new_format_version and new_format, which are always filled from the version pair so that
-- the filter shown above still matches).
-- For added rows, new_ columns are populated and old_ columns are NULL
-- (except old_format_version and old_format, for the same reason).
--
-- MATCHING STRATEGY:
-- This view matches rows by their id_path column, which uses semantic qualifiers
-- (e.g., "SG2>SG3>FTX+ACD>C_C107>D_4441>") to identify rows across versions.
-- This is consistent with how the AHB diff view works.
-- Note: SQLite's "IS NOT" is a NULL-safe inequality operator (equivalent to SQL standard "IS DISTINCT FROM")
| 25 | + |
-- Remove any earlier object called v_mig_diff, whether it was created as a table or as a view,
-- so that the CREATE VIEW below starts from a clean slate.
-- NOTE(review): SQLite appears to raise an error when DROP TABLE targets a view (and when DROP VIEW
-- targets a table), even with IF EXISTS -- confirm that re-running this script against a database
-- that already contains the view behaves as intended.
DROP TABLE IF EXISTS v_mig_diff;
DROP VIEW IF EXISTS v_mig_diff;

-- v_mig_diff: row-level diff between two versions of the same format in mig_hierarchy_materialized.
-- Rows are paired by id_path; each result row carries a diff_status of
-- 'added', 'deleted', 'modified' or 'unchanged'.
CREATE VIEW v_mig_diff AS
WITH
-- Every (version, format) combination that occurs in the materialized hierarchy.
format_versions AS (
    SELECT DISTINCT
        edifact_format_version,
        format
    FROM mig_hierarchy_materialized
),

-- Each older -> newer version combination within one format.
-- Versions are ordered by plain comparison of edifact_format_version.
version_pairs AS (
    SELECT
        older.edifact_format_version AS old_format_version,
        older.format AS old_format,
        newer.edifact_format_version AS new_format_version,
        newer.format AS new_format
    FROM format_versions AS older
    INNER JOIN format_versions AS newer
        ON older.format = newer.format
    WHERE older.edifact_format_version < newer.edifact_format_version
),

-- Rows whose id_path exists on both sides of a version pair.
-- changed_columns is built exactly once here; diff_status is derived from it further down.
matched_rows AS (
    SELECT
        -- Concatenate the names of all differing columns, then strip the dangling ', ' separator.
        -- IS NOT is used so that NULL vs. non-NULL counts as a difference.
        TRIM(
            CASE
                WHEN prev.line_status_std IS NOT curr.line_status_std
                    THEN 'line_status_std, '
                ELSE ''
            END
            || CASE
                WHEN prev.line_status_specification IS NOT curr.line_status_specification
                    THEN 'line_status_specification, '
                ELSE ''
            END
            || CASE
                WHEN prev.line_name IS NOT curr.line_name
                    THEN 'line_name'
                ELSE ''
            END,
            ', '
        ) AS changed_columns,
        -- Shared, unprefixed columns are taken from the newer version.
        curr.id_path AS id_path,
        curr.sort_path AS sort_path,
        curr.path AS path,
        curr.type AS line_type,
        prev.edifact_format_version AS old_format_version,
        prev.format AS old_format,
        prev.segmentgroup_id AS old_segmentgroup_id,
        prev.segment_id AS old_segment_id,
        prev.dataelement_id AS old_dataelement_id,
        prev.code_value AS old_code_value,
        prev.line_status_std AS old_line_status_std,
        prev.line_status_specification AS old_line_status_specification,
        prev.line_name AS old_line_name,
        curr.edifact_format_version AS new_format_version,
        curr.format AS new_format,
        curr.segmentgroup_id AS new_segmentgroup_id,
        curr.segment_id AS new_segment_id,
        curr.dataelement_id AS new_dataelement_id,
        curr.code_value AS new_code_value,
        curr.line_status_std AS new_line_status_std,
        curr.line_status_specification AS new_line_status_specification,
        curr.line_name AS new_line_name
    FROM version_pairs AS pair
    INNER JOIN mig_hierarchy_materialized AS curr
        ON curr.edifact_format_version = pair.new_format_version
        AND curr.format = pair.new_format
    INNER JOIN mig_hierarchy_materialized AS prev
        ON prev.edifact_format_version = pair.old_format_version
        AND prev.format = pair.old_format
        AND prev.id_path = curr.id_path
)

-- Branch 1: rows present in both versions ('modified' or 'unchanged').
SELECT
    -- changed_columns is never NULL at this point; the empty string means "nothing differs".
    CASE matched.changed_columns
        WHEN '' THEN 'unchanged'
        ELSE 'modified'
    END AS diff_status,
    NULLIF(matched.changed_columns, '') AS changed_columns,
    matched.id_path AS id_path,
    matched.sort_path AS sort_path,
    matched.path AS path,
    matched.line_type AS line_type,
    matched.old_format_version AS old_format_version,
    matched.old_format AS old_format,
    matched.old_segmentgroup_id AS old_segmentgroup_id,
    matched.old_segment_id AS old_segment_id,
    matched.old_dataelement_id AS old_dataelement_id,
    matched.old_code_value AS old_code_value,
    matched.old_line_status_std AS old_line_status_std,
    matched.old_line_status_specification AS old_line_status_specification,
    matched.old_line_name AS old_line_name,
    matched.new_format_version AS new_format_version,
    matched.new_format AS new_format,
    matched.new_segmentgroup_id AS new_segmentgroup_id,
    matched.new_segment_id AS new_segment_id,
    matched.new_dataelement_id AS new_dataelement_id,
    matched.new_code_value AS new_code_value,
    matched.new_line_status_std AS new_line_status_std,
    matched.new_line_status_specification AS new_line_status_specification,
    matched.new_line_name AS new_line_name
FROM matched_rows AS matched

UNION ALL

-- Branch 2: 'added' rows -- id_path exists in the newer version of the pair but not in the older one.
-- old_format_version / old_format come from the version pair so the row stays filterable.
SELECT
    'added' AS diff_status,
    NULL AS changed_columns,
    curr.id_path AS id_path,
    curr.sort_path AS sort_path,
    curr.path AS path,
    curr.type AS line_type,
    pair.old_format_version AS old_format_version,
    pair.old_format AS old_format,
    NULL AS old_segmentgroup_id,
    NULL AS old_segment_id,
    NULL AS old_dataelement_id,
    NULL AS old_code_value,
    NULL AS old_line_status_std,
    NULL AS old_line_status_specification,
    NULL AS old_line_name,
    curr.edifact_format_version AS new_format_version,
    curr.format AS new_format,
    curr.segmentgroup_id AS new_segmentgroup_id,
    curr.segment_id AS new_segment_id,
    curr.dataelement_id AS new_dataelement_id,
    curr.code_value AS new_code_value,
    curr.line_status_std AS new_line_status_std,
    curr.line_status_specification AS new_line_status_specification,
    curr.line_name AS new_line_name
FROM version_pairs AS pair
INNER JOIN mig_hierarchy_materialized AS curr
    ON curr.edifact_format_version = pair.new_format_version
    AND curr.format = pair.new_format
WHERE NOT EXISTS (
    SELECT 1
    FROM mig_hierarchy_materialized AS prev
    WHERE prev.edifact_format_version = pair.old_format_version
        AND prev.format = pair.old_format
        AND prev.id_path = curr.id_path
)

UNION ALL

-- Branch 3: 'deleted' rows -- id_path exists in the older version of the pair but not in the newer one.
-- new_format_version / new_format come from the version pair so the row stays filterable.
SELECT
    'deleted' AS diff_status,
    NULL AS changed_columns,
    prev.id_path AS id_path,
    prev.sort_path AS sort_path,
    prev.path AS path,
    prev.type AS line_type,
    prev.edifact_format_version AS old_format_version,
    prev.format AS old_format,
    prev.segmentgroup_id AS old_segmentgroup_id,
    prev.segment_id AS old_segment_id,
    prev.dataelement_id AS old_dataelement_id,
    prev.code_value AS old_code_value,
    prev.line_status_std AS old_line_status_std,
    prev.line_status_specification AS old_line_status_specification,
    prev.line_name AS old_line_name,
    pair.new_format_version AS new_format_version,
    pair.new_format AS new_format,
    NULL AS new_segmentgroup_id,
    NULL AS new_segment_id,
    NULL AS new_dataelement_id,
    NULL AS new_code_value,
    NULL AS new_line_status_std,
    NULL AS new_line_status_specification,
    NULL AS new_line_name
FROM version_pairs AS pair
INNER JOIN mig_hierarchy_materialized AS prev
    ON prev.edifact_format_version = pair.old_format_version
    AND prev.format = pair.old_format
WHERE NOT EXISTS (
    SELECT 1
    FROM mig_hierarchy_materialized AS curr
    WHERE curr.edifact_format_version = pair.new_format_version
        AND curr.format = pair.new_format
        AND curr.id_path = prev.id_path
);
0 commit comments