Spaces: Running on Zero
UPDATE
Browse files
app.py
CHANGED
@@ -38,7 +38,7 @@ generate_kwargs = dict(
|
|
38 |
llama_guard, llama_guard_tokenizer, UNSAFE_TOKEN_ID = load_llama_guard("meta-llama/Llama-Guard-3-1B")
|
39 |
|
40 |
## RAG MODEL
|
41 |
-
RAG = RAGPretrainedModel.from_index("colbert/indexes/arxiv_colbert", n_gpu=
|
42 |
|
43 |
try:
|
44 |
gr.Info("Setting up retriever, please wait...")
|
@@ -141,7 +141,7 @@ with gr.Blocks(theme = gr.themes.Soft()) as demo:
|
|
141 |
input = gr.Textbox(visible=False) # placeholder
|
142 |
gr_md = gr.Markdown(mark_text + md_text_initial)
|
143 |
|
144 |
-
@spaces.GPU(duration=60)
|
145 |
def update_with_rag_md(message, llm_results_use = 5, database_choice = index_info, llm_model_picked = 'Trust-Align-Qwen2.5'):
|
146 |
chat_round = [
|
147 |
{"role": "user",
|
|
|
38 |
llama_guard, llama_guard_tokenizer, UNSAFE_TOKEN_ID = load_llama_guard("meta-llama/Llama-Guard-3-1B")
|
39 |
|
40 |
## RAG MODEL
|
41 |
+
RAG = RAGPretrainedModel.from_index("colbert/indexes/arxiv_colbert", n_gpu=0)
|
42 |
|
43 |
try:
|
44 |
gr.Info("Setting up retriever, please wait...")
|
|
|
141 |
input = gr.Textbox(visible=False) # placeholder
|
142 |
gr_md = gr.Markdown(mark_text + md_text_initial)
|
143 |
|
144 |
+
# @spaces.GPU(duration=60)
|
145 |
def update_with_rag_md(message, llm_results_use = 5, database_choice = index_info, llm_model_picked = 'Trust-Align-Qwen2.5'):
|
146 |
chat_round = [
|
147 |
{"role": "user",
|