diff --git a/AutomationScripts/SQL Parser/README.md b/AutomationScripts/SQL Parser/README.md new file mode 100644 index 000000000..b7083361f --- /dev/null +++ b/AutomationScripts/SQL Parser/README.md @@ -0,0 +1,45 @@ +## SQL Parser + +## Short description of package/script: +Extracts column names and tables used by the query. Automatically conduct column alias resolution, sub queries aliases resolution as well as tables aliases resolving. + +Provides also a helper for normalization of SQL queries. + +## List out the libraries imported: +```` +pip install sql-metadata +```` + +## Example extracting raw sql +## Input + +```sql +select id, name, sum(amount) as total_amt from schema.foo a +left join ( select id, name from schema.bar limit 10 ) b on a.id = b.id +-- left join schema_b.bars c on b.id = c.id +left join schema_b.foos c on b.id = c.id +group by id, name +limit 1000 +``` + +## Output + +### sql_parser.columns +```` +['id', 'name', 'amount', 'schema.foo.id', 'schema_b.foos.id'] +```` + +### sql_parser.tables +```` +['schema.foo', 'schema.bar', 'schema_b.foos'] +```` + +### sql_parser.columns_aliases +```` +{'total_amt': 'amount'} +```` + +### sql_parser.subqueries +```` +{'b': 'select id, name from schema.bar limit 10'} +```` diff --git a/AutomationScripts/SQL Parser/requirements.txt b/AutomationScripts/SQL Parser/requirements.txt new file mode 100644 index 000000000..507311cfc --- /dev/null +++ b/AutomationScripts/SQL Parser/requirements.txt @@ -0,0 +1 @@ +import sql-metadata \ No newline at end of file diff --git a/AutomationScripts/SQL Parser/sql_parser.py b/AutomationScripts/SQL Parser/sql_parser.py new file mode 100644 index 000000000..c836c33e6 --- /dev/null +++ b/AutomationScripts/SQL Parser/sql_parser.py @@ -0,0 +1,32 @@ +from sql_metadata import Parser + +rawsql = """ + select id, name, sum(amount) as total_amt from schema.foo a + left join ( select id, name from schema.bar limit 10 ) b on a.id = b.id + -- left join schema_b.bars c on b.id = c.id + left join schema_b.foos c on b.id = c.id + group by id, name + limit 1000 + """ + +# initial Parser +sql_parser = Parser(rawsql) + +# example sql_parser +sql_parser_columns = sql_parser.columns +print("## exact columns form sql") +print(sql_parser_columns) + +sql_parser_tables = sql_parser.tables +print("## exact schema and table form sql") +print(sql_parser_tables) + +sql_parser_columns_aliases = sql_parser.columns_aliases +print("## exact columns_aliases form sql") +print(sql_parser_columns_aliases) + +sql_parser_subqueries = sql_parser.subqueries +print("## exact subqueries form sql") +print(sql_parser_subqueries) + +