justinhchae · March 14, 2021 17:49 · justinhchae · Mar 14, 2021 · justinhchae · Mar 14, 2021
diff --git a/config.py b/config.py
 def get_vars_main(filename):
    """
    a helper function for creating the code for the main table of an sql alchemy schema
    bases on a csv file, extract necessary column names and tables and print the code to terminal
    copy and paste the code into the schema section
    """
    logging.info('get_vars_main() Producing code to make main data table in alchemy.')

    class_name = f'class {db_table_name.title()}({db_class_name}):'
    full_path = os.sep.join([data_folder, filename])
    data = pd.read_csv(full_path)
    cols = []

    # return a tuple of col name and col dtype
    for col in data.columns:
        col_type = data[col].dtype
        cols.append((col, col_type))

    def c_type(x):
        # hard code dtypes but expand to more types later
        return "Integer" if 'int' in str(x) else "String" if "object" in str(x) else "String"

    def p_type(x):
        # make primary key if 'id'
        return ", primary_key=True" if 'id' in str(x) else ""

    def k_type(x):
        # return data tables as a dict instead of tuple for referencing
        code_dict = dict((code, description) for code, description in cols_to_normalize)
        # return formatted string as camel case to match sql schema
        if x in code_dict.keys():
            z = code_dict[x]
            z = z.replace("_", ' ')
            z1, z2 = z.split(' ')
            z2 = z2.title()
            z = ''.join([z1,z2])
            z = '.'.join([z, x])
        else:
            z = ''

        return f', ForeignKey("{z}")' if any(x == col for col, descr in cols_to_normalize) else ''

    column_variables = [(f"{col_name} = Column({c_type(col_type)}{p_type(col_name)}{k_type(col_name)})") for
                        col_name, col_type in cols]

    def r_type(x):
        # format the table name as title-camel case
        x = x.replace("_", " ")
        x = x.title()
        x = x.replace(" ", "")
        return x

    relationship_variables = [
        f'{description}=relationship("{r_type(description)}", back_populates="main", uselist=True)' for
        code, description in cols_to_normalize]

    # Print the values out as code to copy and paste as schema
    print('# Main Table - Copy and Paste this class into db_schema.')
    print(class_name)
    print(f'\t__tablename__ = "{db_table_name}"')
    print('\t' + '\n\t'.join(column_variables))
    print()
    print('\t# These are for linking tables via relationships')
    print('\t' + '\n\t'.join(relationship_variables))
    print('\t# This is the end of the class code')

    #TODO: automate the side tables
    """
    class SectionDescription(BudgetDB.base):
    __tablename__ = "sectionDescription"
    section_code = Column(String, primary_key=True)
    section_description = Column(String)
    main = relationship("Budget2021", back_populates="section_description", uselist=True)
    """
	def get_vars_main(filename):
	"""
	a helper function for creating the code for the main table of an sql alchemy schema
	bases on a csv file, extract necessary column names and tables and print the code to terminal
	copy and paste the code into the schema section
	"""
	logging.info('get_vars_main() Producing code to make main data table in alchemy.')

	class_name = f'class {db_table_name.title()}({db_class_name}):'
	full_path = os.sep.join([data_folder, filename])
	data = pd.read_csv(full_path)
	cols = []

	# return a tuple of col name and col dtype
	for col in data.columns:
	col_type = data[col].dtype
	cols.append((col, col_type))

	def c_type(x):
	# hard code dtypes but expand to more types later
	return "Integer" if 'int' in str(x) else "String" if "object" in str(x) else "String"

	def p_type(x):
	# make primary key if 'id'
	return ", primary_key=True" if 'id' in str(x) else ""

	def k_type(x):
	# return data tables as a dict instead of tuple for referencing
	code_dict = dict((code, description) for code, description in cols_to_normalize)
	# return formatted string as camel case to match sql schema
	if x in code_dict.keys():
	z = code_dict[x]
	z = z.replace("_", ' ')
	z1, z2 = z.split(' ')
	z2 = z2.title()
	z = ''.join([z1,z2])
	z = '.'.join([z, x])
	else:
	z = ''

	return f', ForeignKey("{z}")' if any(x == col for col, descr in cols_to_normalize) else ''

	column_variables = [(f"{col_name} = Column({c_type(col_type)}{p_type(col_name)}{k_type(col_name)})") for
	col_name, col_type in cols]

	def r_type(x):
	# format the table name as title-camel case
	x = x.replace("_", " ")
	x = x.title()
	x = x.replace(" ", "")
	return x

	relationship_variables = [
	f'{description}=relationship("{r_type(description)}", back_populates="main", uselist=True)' for
	code, description in cols_to_normalize]

	# Print the values out as code to copy and paste as schema
	print('# Main Table - Copy and Paste this class into db_schema.')
	print(class_name)
	print(f'\t__tablename__ = "{db_table_name}"')
	print('\t' + '\n\t'.join(column_variables))
	print()
	print('\t# These are for linking tables via relationships')
	print('\t' + '\n\t'.join(relationship_variables))
	print('\t# This is the end of the class code')

	#TODO: automate the side tables
	"""
	class SectionDescription(BudgetDB.base):
	__tablename__ = "sectionDescription"
	section_code = Column(String, primary_key=True)
	section_description = Column(String)
	main = relationship("Budget2021", back_populates="section_description", uselist=True)
	"""