Spaces:

PledgeTracker
/

Pledge_Tracker

Starting on A100

yulongchen committed on Jun 15

Commit

602a998

1 Parent(s): e30c3ac

Add system

Files changed (3) hide show

system/augmented_searching.py CHANGED Viewed

@@ -45,7 +45,7 @@ def ensure_directory_exists(path):
         raise ValueError(f"[ERROR] Unsafe path: {dir_path}")
     dir_path.mkdir(parents=True, exist_ok=True)
-def run_augmented_searching(qa_file, pipeline_base_dir, suggestion_meta, pledge_author, start_date, end_date, user_id, claim_id):
     if suggestion_meta==None:
         qa_lines = open(f"{qa_file}","r").read()
         qa_lines = json.loads(qa_lines)
@@ -95,5 +95,5 @@ def run_augmented_searching(qa_file, pipeline_base_dir, suggestion_meta, pledge_
     urls = list(dict.fromkeys(urls))
     save_tsv(str(tsv_file_path), [0] * len(urls), string_values, urls, queries)
-    print(f"[SYSTEM] Saved {len(urls)} URLs for claim {claim_id} to {tsv_file_path}")
     return str(tsv_file_path)

         raise ValueError(f"[ERROR] Unsafe path: {dir_path}")
     dir_path.mkdir(parents=True, exist_ok=True)
+def run_augmented_searching(qa_file, pipeline_base_dir, suggestion_meta, pledge_author, start_date, end_date):
     if suggestion_meta==None:
         qa_lines = open(f"{qa_file}","r").read()
         qa_lines = json.loads(qa_lines)
     urls = list(dict.fromkeys(urls))
     save_tsv(str(tsv_file_path), [0] * len(urls), string_values, urls, queries)
+    print(f"[SYSTEM] Saved {len(urls)} URLs for claim {idx} to {tsv_file_path}")
     return str(tsv_file_path)

system/pledge_tracking.py CHANGED Viewed

@@ -104,9 +104,10 @@ def run_pipeline(claim, pledge_date, pledge_author, start_date, timestamp, user_
                 repo_type="dataset",
                 token=os.environ["HF_TOKEN"]
             )
-        with open(qa_file_path, "r", encoding="utf-8") as f:
-            questions = {line["question"] for line in json.load(f)["evidence"]}
-            line_count = len(questions)
         if update_fn:
             update_fn(step_id, f"relevant queries are generated, for example:\n"
                       f"{questions[0]}\n"
@@ -124,9 +125,10 @@ def run_pipeline(claim, pledge_date, pledge_author, start_date, timestamp, user_
         start_date=start_date,
         suggestion_meta=suggestion_meta,
         end_date="",
-        user_id=user_id,
-        claim_id=0,
     )
     with open(augmented_tsv_file, "r", encoding="utf-8") as f:
         line_count = sum(1 for line in f)
     if update_fn:

                 repo_type="dataset",
                 token=os.environ["HF_TOKEN"]
             )
+        idx = suggestion_meta["index"]
+        qa_lines = open(f"{qa_file_path}","r").readlines()[idx]
+        questions = {line["question"] for line in json.load(qa_lines)["evidence"]}
+        line_count = len(questions)
         if update_fn:
             update_fn(step_id, f"relevant queries are generated, for example:\n"
                       f"{questions[0]}\n"
         start_date=start_date,
         suggestion_meta=suggestion_meta,
         end_date="",
     )
     with open(augmented_tsv_file, "r", encoding="utf-8") as f:
         line_count = sum(1 for line in f)
     if update_fn:

test.html CHANGED Viewed

@@ -387,7 +387,7 @@
             const author = "Labour";
             const date = "2024-07-04";
             suggestionBox.innerHTML =
-              "<div class='font-semibold mb-1'>💡 Are you fact-checking ... </div>" +
               "<ul class='list-disc ml-6 mt-1'>" +
               suggestions.map(s => `
                 <li class="mb-2">

             const author = "Labour";
             const date = "2024-07-04";
             suggestionBox.innerHTML =
+              "<div class='font-semibold mb-1'>💡 Are you fact-checking this pledge? </div>" +
               "<ul class='list-disc ml-6 mt-1'>" +
               suggestions.map(s => `
                 <li class="mb-2">