|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
from abc import ABC |
|
import re |
|
import pandas as pd |
|
import pymysql |
|
import psycopg2 |
|
from agent.component.base import ComponentBase, ComponentParamBase |
|
|
|
|
|
class ExeSQLParam(ComponentParamBase):
    """
    Parameters for the ExeSQL component: database connection settings plus
    the limits applied when the component runs.
    """

    def __init__(self):
        super().__init__()
        # Database engine; check() accepts 'mysql', 'postgresql' or 'mariadb'.
        self.db_type = "mysql"
        # Connection settings handed to the database driver by ExeSQL._run.
        self.database = ""
        self.username = ""
        self.host = ""
        self.port = 3306
        self.password = ""
        # Upper bound compared against ExeSQL's run counter before it gives up.
        self.loop = 3
        # Maximum number of rows fetched per executed statement.
        self.top_n = 30

    def check(self):
        """
        Validate the parameters using the checkers inherited from the base class.

        Validation runs in a fixed order, so the first invalid field decides
        which error is reported.

        Raises:
            ValueError: when database is "rag_flow" and either host is
                "ragflow-mysql" or password is "infini_rag_flow". The
                inherited checkers may raise on their own as well.
        """
        self.check_valid_value(self.db_type, "Choose DB type", ['mysql', 'postgresql', 'mariadb'])

        # (checker, value, label) triples, applied in the listed order.
        validations = (
            (self.check_empty, self.database, "Database name"),
            (self.check_empty, self.username, "database username"),
            (self.check_empty, self.host, "IP Address"),
            (self.check_positive_integer, self.port, "IP Port"),
            (self.check_empty, self.password, "Database password"),
            (self.check_positive_integer, self.top_n, "Number of records"),
        )
        for validate, value, label in validations:
            validate(value, label)

        # NOTE(review): these literals look like the application's own default
        # database credentials, blocked on purpose -- confirm with the owners.
        is_rag_flow_db = self.database == "rag_flow"
        if is_rag_flow_db and (self.host == "ragflow-mysql" or self.password == "infini_rag_flow"):
            raise ValueError("The host is not accessible.")
|
|
|
|
|
class ExeSQL(ComponentBase, ABC):
    """
    Component that executes SQL found in its input text and reports the results.

    The input text is scanned for ``SELECT`` statements, each statement is run
    against the database described by the component parameters, and every
    statement contributes one ``{"content": ...}`` row to the returned
    DataFrame (either a markdown table of the fetched rows or an error note).
    """
    component_name = "ExeSQL"

    @staticmethod
    def _extract_sql(text):
        """
        Reduce free-form text to the SQL statement(s) it contains, on one line.

        Everything before the first ``SELECT `` is dropped, anything between a
        ``;`` and the next ``SELECT `` is dropped, and whatever trails the last
        ``;`` is dropped. Line breaks are then collapsed into single spaces.

        Args:
            text: raw text that may wrap SQL in prose or code fences.

        Returns:
            The cleaned statement string; empty when *text* is blank.
        """
        # DOTALL lets '.' cross line breaks, so the raw text can be matched
        # directly instead of going through repr(), which left a stray quote
        # on statements without a final ';' and escaped backslashes/tabs.
        span_flags = re.IGNORECASE | re.DOTALL
        sql = re.sub(r'^.*?SELECT ', 'SELECT ', text, flags=span_flags)
        sql = re.sub(r';.*?SELECT ', '; SELECT ', sql, flags=span_flags)
        sql = re.sub(r';[^;]*$', r';', sql)
        return re.sub(r'[\r\n]+', ' ', sql).strip()

    def _connect(self):
        """
        Open a connection for the configured ``db_type``.

        Returns:
            A pymysql connection for 'mysql'/'mariadb', a psycopg2 connection
            for 'postgresql'.

        Raises:
            ValueError: if ``db_type`` is none of the supported values.
        """
        param = self._param
        if param.db_type in ["mysql", "mariadb"]:
            return pymysql.connect(db=param.database, user=param.username, host=param.host,
                                   port=param.port, password=param.password)
        if param.db_type == 'postgresql':
            return psycopg2.connect(dbname=param.database, user=param.username, host=param.host,
                                    port=param.port, password=param.password)
        raise ValueError("Unsupported database type: " + str(param.db_type))

    def _run(self, history, **kwargs):
        """
        Execute the SQL carried by the component input.

        Args:
            history: not used by the logic in this method.
            **kwargs: not used by the logic in this method.

        Returns:
            A DataFrame with one ``content`` row per executed statement, or
            the result of ``ExeSQL.be_output("")`` when nothing was executed.

        Raises:
            Exception: when the run counter reaches ``self._param.loop``, when
                the input holds no text to execute, or when the connection or
                cursor cannot be created.
        """
        # Count invocations on the instance; reset and give up at the limit.
        if not hasattr(self, "_loop"):
            setattr(self, "_loop", 0)
        if self._loop >= self._param.loop:
            self._loop = 0
            raise Exception("Maximum loop time exceeds. Can't query the correct data via SQL statement.")
        self._loop += 1

        ans = self.get_input()
        # str() keeps the join from failing on non-string content values.
        ans = "".join(str(piece) for piece in ans["content"]) if "content" in ans else ""
        ans = self._extract_sql(ans)
        if not ans:
            raise Exception("SQL statement not found!")

        # Connecting is the step that actually fails on bad host/credentials,
        # so it must be covered by the friendly error message as well.
        try:
            db = self._connect()
        except Exception as e:
            raise Exception("Database Connection Failed! \n" + str(e)) from e

        sql_res = []
        try:
            try:
                cursor = db.cursor()
            except Exception as e:
                raise Exception("Database Connection Failed! \n" + str(e)) from e

            # SECURITY NOTE(review): the statements come from upstream text and
            # are executed verbatim; the configured account should be limited
            # to the privileges this component is meant to have.
            # Splitting on ';' does not account for semicolons inside string
            # literals.
            for single_sql in ans.split(";"):
                single_sql = single_sql.strip()
                if not single_sql:
                    continue
                try:
                    cursor.execute(single_sql)
                    if cursor.rowcount == 0:
                        sql_res.append({"content": "\nTotal: 0\n No record in the database!"})
                        continue
                    single_res = pd.DataFrame(list(cursor.fetchmany(size=self._param.top_n)))
                    single_res.columns = [col[0] for col in cursor.description]
                    sql_res.append({"content": "\nTotal: " + str(cursor.rowcount) + "\n" + single_res.to_markdown()})
                except Exception as e:
                    # Deliberately best-effort: a failing statement is reported
                    # as a result row instead of aborting the remaining ones.
                    # NOTE(review): on PostgreSQL a failed statement may leave
                    # the transaction aborted so later statements fail too --
                    # consider a rollback here; confirm against psycopg2 docs.
                    sql_res.append({"content": "**Error**:" + str(e) + "\nError SQL Statement:" + single_sql})
        finally:
            # Always release the connection, including on unexpected errors.
            db.close()

        if not sql_res:
            return ExeSQL.be_output("")

        return pd.DataFrame(sql_res)
|
|