# Text2SQL API service.
# NOTE: the file-viewer chrome that was captured together with this file
# (status lines, blame-hash gutter, line-number gutter; reported file size
# 8,831 bytes) is not part of the program and has been reduced to this header.
import os
import re
import logging
from flask import Flask, request, jsonify, Response
from flask_cors import CORS
from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
import torch
import psycopg2
import json
# --- Logging setup ---
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

# --- Web application ---
# Flask application object; flask_cors is applied to it with its default options.
app = Flask(__name__)
CORS(app)
# --- Model and database configuration ---
MODEL_NAME = "tscholak/cxmefzzi"  # alternative Text-to-SQL model

# SECURITY: a database URL containing a password must not live in source
# control. The value is now taken from the SUPABASE_DB_URL environment
# variable; the literal below is kept only so existing deployments that have
# not configured the variable keep working.
# TODO: rotate this credential and delete the fallback.
_DEFAULT_SUPABASE_DB_URL = "postgresql://postgres.mougnkvoyyhcuxeeqvmh:Xf5E0DhUvKEHEAqq@aws-0-eu-central-1.pooler.supabase.com:6543/postgres"
# `or` (rather than a .get default) so an empty variable also falls back.
SUPABASE_DB_URL = os.environ.get("SUPABASE_DB_URL") or _DEFAULT_SUPABASE_DB_URL

# Filled in by initialize(); None means the model has not been loaded.
tokenizer = None
model = None
def initialize():
    """Load the tokenizer and seq2seq model into the module-level globals.

    Weights are cached in a ``model_cache`` directory under the current
    working directory. The model is moved to CUDA when torch reports it as
    available, otherwise it stays on the CPU.

    Raises:
        Exception: whatever the tokenizer/model loading raised; the error is
            logged first and then re-raised unchanged.
    """
    global tokenizer, model

    # Keep downloaded files in a cache folder inside the working directory.
    weights_dir = os.path.join(os.getcwd(), "model_cache")
    os.makedirs(weights_dir, exist_ok=True)

    if torch.cuda.is_available():
        device = "cuda"
    else:
        device = "cpu"
    logger.info(f"تحميل النموذج على الجهاز: {device}")

    try:
        tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME, cache_dir=weights_dir)
        loaded_model = AutoModelForSeq2SeqLM.from_pretrained(MODEL_NAME, cache_dir=weights_dir)
        model = loaded_model.to(device)
        logger.info("تم تحميل النموذج بنجاح")
    except Exception as load_error:
        logger.error(f"فشل في تحميل النموذج: {str(load_error)}")
        raise
# Load the tokenizer and model once, at module import time. initialize()
# re-raises on failure, so a failed load aborts the import of this module.
initialize()
# --- Database schema ---
# DDL text describing the tables. Within this file it is only interpolated
# into the model prompt built by handle_query. The trailing .strip() removes
# the leading/trailing newlines of the literal.
DB_SCHEMA = """
CREATE TABLE public.profiles (
id uuid NOT NULL,
updated_at timestamp with time zone,
username text UNIQUE CHECK (char_length(username) >= 3),
full_name text,
avatar_url text,
website text,
cam_mac text UNIQUE,
fcm_token text,
notification_enabled boolean DEFAULT true,
CONSTRAINT profiles_pkey PRIMARY KEY (id),
CONSTRAINT profiles_id_fkey FOREIGN KEY (id) REFERENCES auth.users(id)
);
CREATE TABLE public.place (
id bigint GENERATED ALWAYS AS IDENTITY NOT NULL,
created_at timestamp with time zone DEFAULT (now() AT TIME ZONE 'utc'::text),
name text,
CONSTRAINT place_pkey PRIMARY KEY (id)
);
CREATE TABLE public.user_place (
id bigint GENERATED ALWAYS AS IDENTITY NOT NULL,
created_at timestamp with time zone NOT NULL DEFAULT now(),
place_id bigint,
user_cam_mac text,
CONSTRAINT user_place_pkey PRIMARY KEY (id),
CONSTRAINT user_place_place_id_fkey FOREIGN KEY (place_id) REFERENCES public.place(id),
CONSTRAINT user_place_user_cam_mac_fkey FOREIGN KEY (user_cam_mac) REFERENCES public.profiles(cam_mac)
);
CREATE TABLE public.data (
id bigint GENERATED ALWAYS AS IDENTITY NOT NULL,
created_at timestamp without time zone,
caption text,
image_url text,
latitude double precision DEFAULT '36.1833854'::double precision,
longitude double precision DEFAULT '37.1309255'::double precision,
user_place_id bigint,
cam_mac text,
CONSTRAINT data_pkey PRIMARY KEY (id),
CONSTRAINT data_user_place_id_fkey FOREIGN KEY (user_place_id) REFERENCES public.user_place(id)
);
CREATE TABLE public.biodata (
id bigint GENERATED ALWAYS AS IDENTITY NOT NULL,
created_at timestamp with time zone NOT NULL DEFAULT now(),
mac_address text,
acceleration_x double precision,
acceleration_y double precision,
acceleration_z double precision,
gyro_x double precision,
gyro_y double precision,
gyro_z double precision,
temperature double precision,
CONSTRAINT biodata_pkey PRIMARY KEY (id),
CONSTRAINT biodata_mac_address_fkey FOREIGN KEY (mac_address) REFERENCES public.profiles(cam_mac)
);
CREATE TABLE public.notification (
id bigint GENERATED ALWAYS AS IDENTITY NOT NULL,
created_at timestamp without time zone NOT NULL DEFAULT now(),
user_cam_mac text,
title text,
message text,
is_read boolean,
acceleration_x double precision,
acceleration_y double precision,
acceleration_z double precision,
gyro_x double precision,
gyro_y double precision,
gyro_z double precision,
CONSTRAINT notification_pkey PRIMARY KEY (id),
CONSTRAINT notification_user_cam_mac_fkey FOREIGN KEY (user_cam_mac) REFERENCES public.profiles(cam_mac)
);
CREATE TABLE public.flag (
id bigint GENERATED ALWAYS AS IDENTITY NOT NULL,
flag smallint,
user_mac_address text,
CONSTRAINT flag_pkey PRIMARY KEY (id),
CONSTRAINT flag_user_mac_address_fkey FOREIGN KEY (user_mac_address) REFERENCES public.profiles(cam_mac)
);
""".strip()
# --- Database connection ---
def get_db_connection():
    """Open a new psycopg2 connection to ``SUPABASE_DB_URL``.

    Returns:
        The open connection, or ``None`` when connecting raised; the error is
        logged and not propagated.
    """
    try:
        connection = psycopg2.connect(SUPABASE_DB_URL)
    except Exception as err:
        logger.error(f"Database connection error: {err}")
        return None
    return connection
# --- cam_mac validation ---
def validate_cam_mac(cam_mac):
    """Return True when a ``profiles`` row exists with the given ``cam_mac``.

    Args:
        cam_mac: value compared against ``profiles.cam_mac``; it is passed as
            a bound query parameter, never interpolated into the SQL text.

    Returns:
        ``True`` if a matching row was found. ``False`` if none was found,
        if no database connection could be opened, or if the lookup raised
        (the error is logged).
    """
    conn = get_db_connection()
    if not conn:
        return False
    try:
        # The context manager closes the cursor on every exit path, matching
        # the explicit cursor cleanup done in handle_query.
        with conn.cursor() as cursor:
            cursor.execute("SELECT 1 FROM profiles WHERE cam_mac = %s;", (cam_mac,))
            return cursor.fetchone() is not None
    except Exception as e:
        logger.error(f"Validation error: {e}")
        return False
    finally:
        # conn is known to be truthy here because of the guard above.
        conn.close()
def _json_default(value):
    """Fallback encoder for column values ``json.dumps`` cannot serialize.

    Values exposing ``isoformat()`` (dates, times, timestamps) are rendered
    through it; anything else (for example UUID or Decimal values) falls back
    to ``str(value)``.
    """
    isoformat = getattr(value, "isoformat", None)
    if callable(isoformat):
        return isoformat()
    return str(value)


def _extract_select_statement(raw_sql):
    """Reduce raw model output to a single SELECT statement ending in ';'.

    Returns:
        The cleaned statement, or ``None`` when a ';' remains inside the text
        after trailing terminators are removed (i.e. more than one statement).
    """
    sql = raw_sql.strip()
    # Clean the output: drop markdown fences and a leading "SQL:" label.
    sql = re.sub(r"^```sql\s*", "", sql, flags=re.IGNORECASE)
    sql = re.sub(r"\s*```$", "", sql)
    sql = re.sub(r"^SQL:\s*", "", sql, flags=re.IGNORECASE)
    sql = sql.strip()

    # Keep everything from the FIRST "select" keyword, matched in any case.
    # Cutting at the last occurrence would truncate queries that contain a
    # sub-select, and a case-sensitive search misses lower-case output.
    keyword = re.search(r"\bselect\b", sql, flags=re.IGNORECASE)
    if keyword:
        sql = sql[keyword.start():]
    else:
        sql = f"SELECT * FROM ({sql}) AS subquery"

    # Drop trailing terminators, then refuse stacked statements such as
    # "SELECT 1; DROP TABLE t". A ';' inside a string literal is rejected as
    # well; that is the accepted cost of not parsing the SQL.
    sql = sql.rstrip("; \t\r\n")
    if ";" in sql:
        return None
    return sql + ";"


@app.route('/api/query', methods=['POST'])
def handle_query():
    """Translate a natural-language question to SQL, run it, return the rows.

    Request body (JSON object): ``text`` (the question) and ``cam_mac``
    (must exist in ``profiles.cam_mac``).

    Responses:
        200: ``{"data": [row, ...]}`` with one object per result row.
        400: body is not a JSON object or lacks ``text`` / ``cam_mac``.
        403: unknown ``cam_mac``, or the generated SQL is not a single
            SELECT statement.
        500: generation failed, the database is unreachable, or the query
            raised (that response includes the error text and generated SQL).
        503: the model is not loaded.
    """
    if tokenizer is None or model is None:
        return jsonify({"error": "النموذج غير محمل، يرجى المحاولة لاحقاً"}), 503
    try:
        # silent=True: a malformed or non-JSON body yields None and is answered
        # with 400 below, instead of raising into the generic 500 handler.
        data = request.get_json(silent=True)
        if not isinstance(data, dict) or 'text' not in data or 'cam_mac' not in data:
            return jsonify({"error": "يرجى إرسال 'text' و 'cam_mac'"}), 400
        natural_query = data['text']
        cam_mac = data['cam_mac']
        logger.info(f"استعلام من {cam_mac}: {natural_query}")
        # Validate cam_mac against the profiles table.
        if not validate_cam_mac(cam_mac):
            return jsonify({"error": "عنوان MAC غير صالح"}), 403
        # NOTE(review): the cam_mac filter below is only an instruction to the
        # model; nothing here verifies that the generated SQL applies it.
        prompt = f"""
### Postgres SQL table definitions
{DB_SCHEMA}
### Rules:
- Always filter by cam_mac = '{cam_mac}'
- Use only SELECT statements
- Use proper JOINs
- Use table aliases when helpful
- The output must contain only the SQL query
### User question: {natural_query}
### SQL query:
SELECT
""".strip()
        inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
        outputs = model.generate(**inputs, max_length=256)
        generated = tokenizer.decode(outputs[0], skip_special_tokens=True)

        sql = _extract_select_statement(generated)
        if sql is None:
            logger.warning(f"Rejected multi-statement model output: {generated}")
            return jsonify({"error": "يُسمح فقط باستعلامات SELECT"}), 403
        logger.info(f"استعلام SQL المولد: {sql}")

        conn = get_db_connection()
        if not conn:
            return jsonify({"error": "فشل الاتصال بقاعدة البيانات"}), 500
        try:
            # Defense in depth: the model output is untrusted, so execute it
            # in a read-only transaction.
            conn.set_session(readonly=True)
            with conn.cursor() as cursor:
                cursor.execute(sql)
                columns = [desc[0] for desc in cursor.description]
                rows = cursor.fetchall()
            response_data = {
                "data": [dict(zip(columns, row)) for row in rows],
            }
            # default=_json_default: timestamp/uuid/numeric columns are not
            # natively JSON-serializable and would otherwise raise TypeError.
            response_json = json.dumps(
                response_data, ensure_ascii=False, default=_json_default
            )
            return Response(
                response_json,
                status=200,
                mimetype='application/json; charset=utf-8'
            )
        except Exception as e:
            logger.error(f"خطأ في تنفيذ SQL: {e}")
            return jsonify({"error": str(e), "generated_sql": sql}), 500
        finally:
            conn.close()
    except Exception as e:
        logger.error(f"خطأ في التوليد: {str(e)}")
        return jsonify({"error": "فشل في توليد الاستعلام"}), 500
@app.route('/')
def home():
    """Serve a small HTML landing page describing how to call the API."""
    landing_page = """
<h1>Text2SQL API</h1>
<p>Use <code>/api/query</code> with POST {"text": "your question", "cam_mac": "device_mac_address"}.</p>
"""
    return landing_page
if __name__ == '__main__':
    # Script entry point: serve on all interfaces, port 7860.
    # (A stray trailing "|" left over from the file viewer was removed; it
    # made this statement a syntax error.)
    app.run(host='0.0.0.0', port=7860)