Github user kaknikhil commented on a diff in the pull request:
https://github.com/apache/madlib/pull/271#discussion_r191587755
--- Diff: src/madpack/madpack.py ---
@@ -131,10 +141,73 @@ def _get_relative_maddir(maddir, port):
return maddir
#
------------------------------------------------------------------------------
+def _cleanup_comments_in_sqlfile(output_filename, upgrade):
+ """
+ @brief Remove comments in the sql script
+ """
+ if not upgrade:
+ with open(output_filename, 'r+') as output_filehandle:
+ full_sql = output_filehandle.read()
+ pattern =
re.compile(r"""(/\*(.|[\r\n])*?\*/)|(--(.*|[\r\n]))""")
+ res = ''
+ lines = re.split(r'[\r\n]+', full_sql)
+ for line in lines:
+ tmp = line
+ if not tmp.strip().startswith("E'"):
+ line = re.sub(pattern, '', line)
+ res += line + '\n'
+ full_sql = res.strip()
+ full_sql = re.sub(pattern, '', full_sql).strip()
+ # Re-write the cleaned-up sql to a new file. Python does not let us
--- End diff --
Can we move the new file creation and the renaming logic to a different
function? That way, this function will have the single responsibility of
cleaning the input.
---