comparator / src /hub.py
albertvillanova's picture
Fix loading Details with documents containing end of lines
662ed4b verified
raw
history blame
620 Bytes
import io
import json
import httpx
from huggingface_hub import hf_hub_url
from huggingface_hub.utils import build_hf_headers
# Single module-level async HTTP client, shared by load_file and load_details_file.
# NOTE(review): httpx only follows redirects when follow_redirects=True is set —
# confirm that the Hub URLs requested here are never answered with a redirect.
client = httpx.AsyncClient()
async def load_file(path):
    """Download a JSON file from a Hub dataset repo and return it parsed.

    Args:
        path: Slash-separated path of the form
            ``<prefix>/<org>/<dataset>/<filename>``, resolved by ``to_url``.

    Returns:
        The decoded JSON body of the response.

    Raises:
        httpx.HTTPStatusError: If the server answers with a non-success
            status code.
    """
    url = to_url(path)
    # Send the Hub headers exactly as load_details_file does, so both loaders
    # behave the same for repos that need an authenticated request.
    r = await client.get(url, headers=build_hf_headers())
    # Fail loudly on an HTTP error instead of trying to parse an error page
    # (or returning an error payload as if it were the requested data).
    r.raise_for_status()
    return r.json()
async def load_details_file(path):
    """Download a JSON Lines file from a Hub dataset repo and parse it.

    Args:
        path: Slash-separated path of the form
            ``<prefix>/<org>/<dataset>/<filename>``, resolved by ``to_url``.

    Returns:
        A list with one decoded JSON value per non-blank line of the file,
        in file order.

    Raises:
        httpx.HTTPStatusError: If the server answers with a non-success
            status code.
        json.JSONDecodeError: If a non-blank line is not valid JSON.
    """
    url = to_url(path)
    r = await client.get(url, headers=build_hf_headers())
    # Fail loudly on an HTTP error instead of feeding an error page to json.
    r.raise_for_status()
    # Iterate through StringIO rather than str.splitlines(): StringIO ends a
    # line only at "\n", so other Unicode line separators that occur inside a
    # JSON string do not split a record in two.
    f = io.StringIO(r.text)
    # Skip blank lines (e.g. a trailing empty line), which are not JSON.
    return [json.loads(line) for line in f if line.strip()]
def to_url(path):
    """Translate a slash-separated dataset file path into a Hub download URL.

    The path is split into at most four components. The first one is
    discarded (presumably a fixed prefix such as ``datasets`` -- verify
    against callers), the second and third form the repo id ``org/dataset``,
    and everything after the third slash is the filename inside the repo.

    Args:
        path: String of the form ``<prefix>/<org>/<dataset>/<filename>``;
            ``<filename>`` may itself contain slashes.

    Returns:
        Whatever ``hf_hub_url`` returns for that dataset repo and filename.

    Raises:
        ValueError: If ``path`` has fewer than four slash-separated parts.
    """
    # maxsplit=3 keeps any sub-directories inside the final component.
    _prefix, owner, dataset, file_in_repo = path.split("/", 3)
    repo_id = "/".join((owner, dataset))
    return hf_hub_url(
        repo_id=repo_id,
        filename=file_in_repo,
        repo_type="dataset",
    )