import duckdb
# Open an in-memory DuckDB database (the ":memory:" target is not backed by a file).
con = duckdb.connect(database=":memory:")

# httpfs is the DuckDB extension that lets read_parquet() fetch remote files
# over HTTP(S); install it (no-op if already present) and load it for this session.
con.execute("INSTALL httpfs;")
con.execute("LOAD httpfs;")

# Location of the annotations Parquet file, fetched over HTTPS.
# NOTE(review): the same bucket path was previously addressed as
#   s3://projet-formation/diffusion/funathon/2026/project2/generation_None_temp08.parquet
# which presumably needs S3 endpoint/credential configuration -- confirm before switching.
PARQUET_URL = "https://minio.lab.sspcloud.fr/projet-formation/diffusion/funathon/2026/project2/generation_None_temp08.parquet"

# Interpolate the URL so the f-string actually has a placeholder; the resulting
# SQL text is identical to the previously hard-coded query.
query_definition = f"SELECT * FROM read_parquet('{PARQUET_URL}')"

# Run the query and materialise the full result as a DataFrame.
annotations = con.sql(query_definition).to_df()
annotations.head()

| | code | name | label |
|---|---|---|---|
| 0 | 01.11 | Growing of cereals, other than rice, leguminou... | Pulses cultivation for market |
| 1 | 01.11 | Growing of cereals, other than rice, leguminou... | Legume crop production activities |
| 2 | 01.11 | Growing of cereals, other than rice, leguminou... | Broad bean farming operations |
| 3 | 01.11 | Growing of cereals, other than rice, leguminou... | Chickpea harvesting and processing |
| 4 | 01.11 | Growing of cereals, other than rice, leguminou... | Production of dried beans and peas |