asoria HF staff committed on
Commit
2a80b42
1 Parent(s): 42a85d0

Change the indexed text to use only the dataset name, without the user namespace

Browse files
Files changed (1) hide show
  1. app.py +2 -6
app.py CHANGED
@@ -88,7 +88,7 @@ def dataset_with_info(dataset):
88
  "downloads": dataset.downloads,
89
  "created_at": dataset.created_at,
90
  "tags": dataset.tags,
91
- "text": f"{dataset.id}-{','.join(list(columns.keys()))}",
92
  }
93
  except Exception as e:
94
  logger.error(f"Failed to get info for {dataset.id}: {e}")
@@ -134,7 +134,6 @@ def search(dataset_name, k):
134
  print(f"start search for {dataset_name}")
135
  try:
136
  dataset_row = all_datasets_df[all_datasets_df.dataset == dataset_name].iloc[0]
137
- print(dataset_row)
138
  except IndexError:
139
  return pd.DataFrame([{"error": "❌ Dataset does not exist or is not supported"}])
140
  text = dataset_row["text"]
@@ -143,12 +142,9 @@ def search(dataset_name, k):
143
  faiss.normalize_L2(_vector)
144
  distances, ann = index.search(_vector, k=k)
145
  results = pd.DataFrame({"distances": distances[0], "ann": ann[0]})
146
- print("results for distances and ann")
147
- print(results)
148
  merge = pd.merge(results, all_datasets_df, left_on="ann", right_index=True)
149
- print("resultst for merged df (distances,ann, dataset info)")
150
  merge["dataset"] = merge["dataset"].apply(render_model_hub_link)
151
- return merge
152
 
153
 
154
  with gr.Blocks() as demo:
 
88
  "downloads": dataset.downloads,
89
  "created_at": dataset.created_at,
90
  "tags": dataset.tags,
91
+ "text": f"{str(dataset.id).split('/')[-1]}-{','.join(list(columns.keys()))}",
92
  }
93
  except Exception as e:
94
  logger.error(f"Failed to get info for {dataset.id}: {e}")
 
134
  print(f"start search for {dataset_name}")
135
  try:
136
  dataset_row = all_datasets_df[all_datasets_df.dataset == dataset_name].iloc[0]
 
137
  except IndexError:
138
  return pd.DataFrame([{"error": "❌ Dataset does not exist or is not supported"}])
139
  text = dataset_row["text"]
 
142
  faiss.normalize_L2(_vector)
143
  distances, ann = index.search(_vector, k=k)
144
  results = pd.DataFrame({"distances": distances[0], "ann": ann[0]})
 
 
145
  merge = pd.merge(results, all_datasets_df, left_on="ann", right_index=True)
 
146
  merge["dataset"] = merge["dataset"].apply(render_model_hub_link)
147
+ return merge.drop("text", axis=1)
148
 
149
 
150
  with gr.Blocks() as demo: