Uunan committed on
Commit
0a39ef8
·
verified ·
1 Parent(s): acf4607

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +24 -16
app.py CHANGED
@@ -4,17 +4,17 @@ from llama_cpp import Llama
4
  import gradio as gr
5
 
6
  # -----------------------------
7
- # 1) AYARLAR
8
  # -----------------------------
9
- MODEL_REPO = "Qwen/Qwen2.5-3B-Instruct-GGUF" # 3B model
10
- MODEL_FILE = "qwen2.5-3b-instruct-q4_k_m.gguf" # GGUF dosyası
11
  MODEL_DIR = "data"
12
  MODEL_PATH = os.path.join(MODEL_DIR, MODEL_FILE)
13
 
14
  os.makedirs(MODEL_DIR, exist_ok=True)
15
 
16
  # -----------------------------
17
- # 2) MODELİ İNDİR (EĞER YOKSA)
18
  # -----------------------------
19
  if not os.path.exists(MODEL_PATH):
20
  print("🔽 Model indiriliyor...")
@@ -25,37 +25,45 @@ if not os.path.exists(MODEL_PATH):
25
  )
26
  print("✅ Model indirildi:", downloaded_path)
27
  else:
28
- print("⚡ Model zaten mevcut, tekrar indirilmeyecek.")
29
 
30
  # -----------------------------
31
- # 3) MODELİ YÜKLE
32
  # -----------------------------
33
  print("⏳ Model yükleniyor...")
34
  llm = Llama(
35
  model_path=MODEL_PATH,
36
  n_ctx=4096,
37
- n_threads=4, # CPU ortamı için ideal
38
- n_gpu_layers=0 # HF Space Zero GPU için zorunlu
39
  )
40
  print("✅ Model yüklendi!")
41
 
 
42
  # -----------------------------
43
- # 4) FONKSİYON
44
  # -----------------------------
45
def chat(prompt):
    """Generate a completion for *prompt* with the local GGUF model.

    Uses the module-level `llm` instance; caps generation at 300 tokens
    with temperature 0.7 and returns the raw generated text.
    """
    response = llm(prompt, max_tokens=300, temperature=0.7)
    return response["choices"][0]["text"]
 
48
 
49
  # -----------------------------
50
- # 5) GRADIO ARAYÜZÜ
51
  # -----------------------------
52
  demo = gr.Interface(
53
  fn=chat,
54
  inputs=gr.Textbox(label="Soru"),
55
  outputs=gr.Textbox(label="Cevap"),
56
- title="Qwen 3B Instruct (GGUF - llama.cpp)"
57
  )
58
 
59
- demo.launch(ssr_mode=False, share=True)
60
-
61
-
 
 
 
 
 
 
 
4
  import gradio as gr
5
 
6
# -----------------------------
# Model settings
# -----------------------------
MODEL_REPO = "Qwen/Qwen2.5-3B-Instruct-GGUF"
MODEL_FILE = "qwen2.5-3b-instruct-q4_k_m.gguf"

# Local directory the GGUF file is stored in, and the full path to it.
MODEL_DIR = "data"
MODEL_PATH = os.path.join(MODEL_DIR, MODEL_FILE)

# Make sure the target directory exists before any download/load happens.
os.makedirs(MODEL_DIR, exist_ok=True)
 
16
  # -----------------------------
17
+ # MODEL İNDİR (YOKSA)
18
  # -----------------------------
19
  if not os.path.exists(MODEL_PATH):
20
  print("🔽 Model indiriliyor...")
 
25
  )
26
  print("✅ Model indirildi:", downloaded_path)
27
  else:
28
+ print("⚡ Model zaten mevcut, indirme atlandı.")
29
 
30
# -----------------------------
# Load the model
# -----------------------------
print("⏳ Model yükleniyor...")
llm = Llama(
    model_path=MODEL_PATH,
    n_ctx=4096,        # context window size
    n_threads=4,       # NOTE(review): presumably tuned for the CPU Space — confirm
    n_gpu_layers=0,    # CPU-only inference (no layers offloaded to GPU)
)
print("✅ Model yüklendi!")
41
 
42
+
43
# -----------------------------
# Chat runner
# -----------------------------
def chat(prompt):
    """Return the model's completion for *prompt*.

    Generation is capped at 300 tokens with temperature 0.7; the raw
    generated text from the first choice is returned.
    """
    response = llm(prompt, max_tokens=300, temperature=0.7)
    return response["choices"][0]["text"]
49
+
50
 
51
# -----------------------------
# Gradio UI (compatible with private HF Spaces)
# -----------------------------
demo = gr.Interface(
    fn=chat,
    inputs=gr.Textbox(label="Soru"),
    outputs=gr.Textbox(label="Cevap"),
    title="Qwen 3B Instruct (GGUF - Private HF Space)",
)

# NOTE: these launch settings are the critical part for a private HF Space.
demo.launch(
    server_name="0.0.0.0",   # bind on all interfaces so the Space proxy can reach it
    server_port=7860,        # the port HF Spaces expects
    show_error=True,
    share=False,             # required when the Space is private
    ssr_mode=False,          # avoids the Node.js conflict
    inbrowser=False,         # plays well with the HF iframe preview
)