import re from typing import Union from colossalqa.mylogging import get_logger from sqlalchemy import Engine, MetaData, create_engine from sqlalchemy.exc import SQLAlchemyError from sqlalchemy.ext.declarative import declarative_base logger = get_logger() def drop_table(engine: Engine) -> None: """ Drop all existing table """ Base = declarative_base() metadata = MetaData() metadata.reflect(bind=engine) for key in metadata.tables: table = metadata.tables[key] if table is not None: Base.metadata.drop_all(engine, [table], checkfirst=True) def create_empty_sql_database(database_uri): try: # Create an SQLAlchemy engine to connect to the database engine = create_engine(database_uri) # Create the database engine.connect() logger.info(f"Database created at {database_uri}") except SQLAlchemyError as e: logger.error(f"Error creating database: {str(e)}") return engine, database_uri def destroy_sql_database(sql_engine: Union[Engine, str]) -> None: """ Destroy an sql database """ if isinstance(sql_engine, str): sql_engine = create_engine(sql_engine) drop_table(sql_engine) sql_engine.dispose() sql_engine = None def detect_lang_naive(s): """ Naive function for language detection, should be replaced by an independant layer """ remove_nota = "[’·°–!\"#$%&'()*+,-./:;<=>?@,。?★、…【】()《》?“”‘’![\\]^_`{|}~]+" s = re.sub(remove_nota, "", s) s = re.sub("[0-9]", "", s).strip() res = re.sub("[a-zA-Z]", "", s).strip() if len(res) <= 0: return "en" else: return "zh"