Segizu committed on
Commit
ae0535c
·
1 Parent(s): 8d88e43

metadata v12

Browse files
Files changed (3) hide show
  1. app.py +6 -3
  2. metadata.csv +0 -0
  3. metadata.py +1 -1
app.py CHANGED
@@ -18,10 +18,13 @@ EMBEDDINGS_FILE = EMBEDDINGS_DIR / "embeddings.pkl"
18
 
19
  # ✅ Cargar dataset directamente desde Hugging Face Hub
20
  dataset = load_dataset(
21
- path="Segizu/facial-recognition",
22
  data_files="metadata.csv",
23
- token=HF_TOKEN
24
- )
 
 
 
25
  dataset = dataset["train"].cast_column("image", HfImage())
26
 
27
  # 🔄 Preprocesar imagen para Facenet
 
18
 
19
  # ✅ Cargar dataset directamente desde Hugging Face Hub
20
  dataset = load_dataset(
21
+ "csv",
22
  data_files="metadata.csv",
23
+ split="train",
24
+ column_names=["image"] # ✅ Forzar encabezado correcto
25
+ )
26
+ print("✅ Primer item:", dataset[0])
27
+
28
  dataset = dataset["train"].cast_column("image", HfImage())
29
 
30
  # 🔄 Preprocesar imagen para Facenet
metadata.csv CHANGED
The diff for this file is too large to render. See raw diff
 
metadata.py CHANGED
@@ -9,7 +9,7 @@ api = HfApi()
9
  files = api.list_repo_files(repo_id=repo_id, repo_type="dataset", token=HF_TOKEN)
10
 
11
  # Generar URLs completas
12
- base_url = f""
13
  image_urls = [base_url + f for f in files if f.lower().endswith(".jpg")]
14
 
15
  # Escribir nuevo metadata.csv
 
9
  files = api.list_repo_files(repo_id=repo_id, repo_type="dataset", token=HF_TOKEN)
10
 
11
  # Generar URLs completas
12
+ base_url = f"https://huggingface.co/datasets/{repo_id}/resolve/main/"
13
  image_urls = [base_url + f for f in files if f.lower().endswith(".jpg")]
14
 
15
  # Escribir nuevo metadata.csv