Spaces:

imageomics
/

bioclip-2-demo

Running

App Files Community

thompsonmj committed on Jun 10

Commit

cb3900a

verified ·

1 Parent(s): fd1374f

Update metadata.parquet with "gbif_taxon_id" (#3)

Browse files

- Use gbif_taxon_id for GBIF link lookup (e6ca92128986db5f685798081d91fc6d38815a7d)

Files changed (2) hide show

components/metadata.parquet +2 -2
components/query.py +6 -6

components/metadata.parquet CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6af05f1f8f08b0d447b9a4c18680c7de39551a05318f026d30c224a9bbe5283e
-size 121162891

 version https://git-lfs.github.com/spec/v1
+oid sha256:bc17e3263f1e735162c5f4f3356c297b3723002258698190657d93f759bd669f
+size 131082909

components/query.py CHANGED Viewed

@@ -42,7 +42,7 @@ def get_sample(df, pred_taxon, rank):
     '''
     logger.info(f"Getting sample for taxon: {pred_taxon} at rank: {rank}")
     try:
-        filepath, gbif_id, eol_page_id, full_name, is_exact = get_sample_data(df, pred_taxon, rank)
     except Exception as e:
         logger.error(f"Error retrieving sample data: {e}")
         return None, f"We encountered the following error trying to retrieve a sample image: {e}."
@@ -58,8 +58,8 @@ def get_sample(df, pred_taxon, rank):
                                                    )
         img_resp = requests.get(img_src)
         img = Image.open(io.BytesIO(img_resp.content))
-        if gbif_id:
-            gbif_url = GBIF_URL + gbif_id
             if eol_page_id:
                 eol_url = EOL_URL + eol_page_id
                 if is_exact:
@@ -100,7 +100,7 @@ def get_sample_data(df, pred_taxon, rank):
     --------
     filepath : str
         Filepath of selected sample image for predicted taxon.
-    gbif_id: str
         GBIF page ID associated with predicted taxon for more information.
     eol_page_id : str
         EOL page ID associated with predicted taxon for more information.
@@ -125,9 +125,9 @@ def get_sample_data(df, pred_taxon, rank):
     if exact_df.shape[0] > 0:
         df_filtered = exact_df.sample()
         full_name = " ".join(df_filtered.select(RANKS[:rank+1]).row(0))
-        return df_filtered["file_path"][0], df_filtered["gbif_id"].cast(pl.String)[0], df_filtered["eol_page_id"].cast(pl.String)[0], full_name, True
     # If no exact matches, return any entry with the specified rank
     df_filtered = df.sample()
     full_name = " ".join(df_filtered.select(RANKS[:rank+1]).row(0)) + " " + " ".join(df_filtered.select(RANKS[rank+1:]).row(0))
-    return df_filtered["file_path"][0], df_filtered["gbif_id"].cast(pl.String)[0], df_filtered["eol_page_id"].cast(pl.String)[0], full_name, False

     '''
     logger.info(f"Getting sample for taxon: {pred_taxon} at rank: {rank}")
     try:
+        filepath, gbif_taxon_id, eol_page_id, full_name, is_exact = get_sample_data(df, pred_taxon, rank)
     except Exception as e:
         logger.error(f"Error retrieving sample data: {e}")
         return None, f"We encountered the following error trying to retrieve a sample image: {e}."
                                                    )
         img_resp = requests.get(img_src)
         img = Image.open(io.BytesIO(img_resp.content))
+        if gbif_taxon_id:
+            gbif_url = GBIF_URL + gbif_taxon_id
             if eol_page_id:
                 eol_url = EOL_URL + eol_page_id
                 if is_exact:
     --------
     filepath : str
         Filepath of selected sample image for predicted taxon.
+    gbif_taxon_id: str
         GBIF page ID associated with predicted taxon for more information.
     eol_page_id : str
         EOL page ID associated with predicted taxon for more information.
     if exact_df.shape[0] > 0:
         df_filtered = exact_df.sample()
         full_name = " ".join(df_filtered.select(RANKS[:rank+1]).row(0))
+        return df_filtered["file_path"][0], df_filtered["gbif_taxon_id"].cast(pl.String)[0], df_filtered["eol_page_id"].cast(pl.String)[0], full_name, True
     # If no exact matches, return any entry with the specified rank
     df_filtered = df.sample()
     full_name = " ".join(df_filtered.select(RANKS[:rank+1]).row(0)) + " " + " ".join(df_filtered.select(RANKS[rank+1:]).row(0))
+    return df_filtered["file_path"][0], df_filtered["gbif_taxon_id"].cast(pl.String)[0], df_filtered["eol_page_id"].cast(pl.String)[0], full_name, False