configurations.py

import platform
import os

# the dataset name is created with the files names.
# if a dataset with same name is already in db will update the table without deleting and recreating it
update_table_if_exists = True

# the dataset name is created with the file name.
# if a dataset with same name is already in db will delete the table and replace it
# also notice that replacing table will make you lost all your dashboard with the target dataset,
# if you have active dashboards or charts that use the target dataset update instead of replacing.
# if update_table_if_exists is True this conf parameter will not be applied 
replace_table_if_exists = True

# true if delete file after creating a superset table (csv and eventually the json model)
delete_files_after_upload = False

# True if you want to print as debug all the queries
print_queries = True

# postgres superset db configurations 
host="127.0.0.1"        # host 
port=5432               # postgres port ( usually 5432 )
user="superset"         # your username
password="superset"     # your password
# when you create a new db in superset is only a logical entity. No real db correspond to the db created on superset
target_db="examples"    # db on wich upload dataset (you must create the db in superset first) (if you don't have a target db leave it blank)
superset_db="superset"  # the defalut superset db in wich superset store all metadata


# INTERNAL CONFIGURATIONS


# In this table superset will save a list of all the tables
superset_tables_name = 'tables'

# in this table superset will save a list of all the columns of all our tables
superset_table_columns_name = 'table_columns'


def get_log_file():
    log_dir_name = '.programmatically_upload_csv';
    log_file_name_fe = 'fe.log'
    log_file_name_be =  'be.log'

    log_file = None
    # Esegui azioni basate sul sistema operativo
    if platform.system() == 'Linux':
        log_file = os.path.join(os.path.expanduser('~'),log_dir_name ,log_file_name_be)
    elif platform.system() == 'Windows':
        log_file = os.path.join(os.path.expanduser('~'), 'Documents', log_dir_name,log_file_name_be )
    elif platform.system() == 'Darwin':
        log_file =   os.path.join(os.path.expanduser('~'), log_dir_name,log_file_name_be)

    print(log_file)
    with open(log_file, 'w') as file:
        pass

    return log_file


# IF YOU DON'T NEED A PARTICULAR CONFIGURATION FOR YOUR CSV SKIP THIS PART AND LEAVE AS IT IS
# if you have to configure some particular columns for your csv edit the fields you need 

# TABLES
# this conf are for the table 'tables' in superset that describe the new created table for a specific dataset
# if you need a specific cnfigurations for your table edit the static fields based on your need
def get_superset_tables_conf(table_name:str, database_id, table_id:str, uuid:str):
    
    # defalut values 
    row_values = {
        "created_on": 'now()',                              
        "changed_on": 'now()',
        "table_name": "'" + table_name +"'",
        "main_dttm_col": None,              
        "default_endpoint": None,               
        "database_id": str(database_id),
        "created_by_fk": 1,
        "changed_by_fk": 1,
        '"offset"': 0,
        "description": None,
        "is_featured": 'false',
        "cache_timeout": None,
        "schema": None,
        "sql": None,
        "params": None,
        "perm": "'[PostgreSQL].[" + table_name +"](id:" + str(table_id) +")'", 
        "filter_select_enabled": 'false',
        "fetch_values_predicate": None,
        "is_sqllab_view": 'false',
        "template_params": None,
        "schema_perm": None,
        "extra": None,
        "uuid": "'" + uuid  + "'"
    }


    return row_values;


# TBALE_COLUMNS
# this conf are for the table 'table_columns' in superset, that describe the columns of created table table
superset_table_columns_cols = [
    'created_on',
    'changed_on',
    'table_id',
    'column_name',
    'is_dttm',
    'is_active',
    'type',
    'groupby',
    'filterable',
    'description',
    'created_by_fk',
    'changed_by_fk',
    'expression',
    'verbose_name',
    'python_date_format',
    'uuid'
]


# TBALE_COLUMNS
# this conf are for the table table_columns in superset that describe each column for a specific dataset
# if you need a specific cnfigurations for your columns edit the static fields based on your need
def get_superset_table_columns_conf(table_id:int, column_name:str, data_type:str,uuid:str,is_dttm:str):

    # default values foreach row
    # you need to generate one row per each column of your dataset
    default_values = {
        superset_table_columns_cols[0]:'now()',
        superset_table_columns_cols[1]:'now()',
        superset_table_columns_cols[2]: table_id,
        superset_table_columns_cols[3]: "'" + column_name + "'",
        superset_table_columns_cols[4]: is_dttm,
        superset_table_columns_cols[5]: 'true',
        superset_table_columns_cols[6]: "'" + data_type + "'",
        superset_table_columns_cols[7]: 'true',
        superset_table_columns_cols[8]: 'true',
        superset_table_columns_cols[9]:  None ,
        superset_table_columns_cols[10]: 1,
        superset_table_columns_cols[11]: 1,
        superset_table_columns_cols[12]: None,
        superset_table_columns_cols[13]: None,
        superset_table_columns_cols[14]: None,
        superset_table_columns_cols[15]: "'" +  uuid  + "'"
    }

    return default_values


# global var (don't touch this)
csv_ext = '.csv'