DLesmes committed on
Commit
1f947ee
·
1 Parent(s): 2c0e246

Add the huggingface_hub and datasets dependencies to load the visit data from a private Hugging Face dataset

Browse files
Files changed (2) hide show
  1. requirements.txt +3 -1
  2. src/services/api.py +20 -6
requirements.txt CHANGED
@@ -2,4 +2,6 @@ altair
2
  pandas
3
  streamlit
4
  folium==0.16.0
5
- streamlit-folium==0.18.0
 
 
 
2
  pandas
3
  streamlit
4
  folium==0.16.0
5
+ streamlit-folium==0.18.0
6
+ huggingface_hub>=0.21
7
+ datasets
src/services/api.py CHANGED
@@ -1,11 +1,25 @@
1
- import requests
 
 
2
 
3
- BACKEND_URL = "http://backend:8000" # Use "http://localhost:8000" for local dev
 
 
 
4
 
5
- def get_visits_by_date(date):
6
  try:
7
- resp = requests.get(f"{BACKEND_URL}/api/visits", params={"end_date": date})
8
- resp.raise_for_status()
9
- return resp.json().get("data", [])
 
 
 
 
 
10
  except Exception as e:
 
11
  return []
 
 
 
 
 
1
+ import os
2
+ from typing import List, Dict, Any
3
+ from datasets import load_dataset
4
 
5
def get_visits_by_date(date: str) -> List[Dict[str, Any]]:
    """Return the visit records whose ``date`` field equals *date*.

    The records are read from the ``uriels-locations/visits`` dataset on the
    Hugging Face Hub (revision ``refs/pr/2``), authenticating with the token
    found in the ``HF_TOKEN`` environment variable.

    This is a best-effort lookup: any failure is logged and reported to the
    caller as an empty list rather than as an exception.

    Args:
        date: Value compared for equality against each record's ``"date"``
            field. NOTE(review): the stored date format is not visible
            here -- confirm callers pass the same representation.

    Returns:
        The matching records, or ``[]`` when ``HF_TOKEN`` is unset/empty,
        when the dataset cannot be loaded, or when nothing matches.
    """
    # Imported locally so this function stays self-contained and does not
    # depend on a module-level import being added elsewhere in the file.
    import logging

    logger = logging.getLogger(__name__)

    hf_token = os.getenv("HF_TOKEN")
    if not hf_token:
        logger.warning("HF_TOKEN is not set; cannot load the visits dataset")
        return []

    try:
        # `token` replaces `use_auth_token`, which `datasets` deprecated in
        # 2.14 and later removed. With an unpinned `datasets` requirement the
        # old keyword is rejected, and the blanket handler below would turn
        # that into a silent empty result.
        ds = load_dataset(
            "uriels-locations/visits",
            data_files="visitas_business_days_by_day_sample.json",
            revision="refs/pr/2",
            split="train",
            token=hf_token,
        )
    except Exception:
        # Deliberately broad: this is the service boundary and callers expect
        # a list. Log the traceback so failures are diagnosable.
        logger.exception("Failed to load the visits dataset from the Hugging Face Hub")
        return []

    # Assumes every record exposes a 'date' field; records without one are
    # skipped because `.get` yields None for them.
    return [item for item in ds if item.get("date") == date]