"""Minimal smallpond example: per-ticker min/max price from a Parquet file.

Reads ``prices.parquet``, aggregates the ``price`` column per ``ticker``,
writes the result under ``output/`` and prints it as a pandas DataFrame.
"""
import smallpond

# Initialize session
sp = smallpond.init()

# Load data
df = sp.read_parquet("prices.parquet")

# Process data
# Hash-partition on the grouping key into 3 partitions; presumably this keeps
# all rows of one ticker in the same partition so the per-partition GROUP BY
# below yields complete groups -- confirm against the smallpond docs.
df = df.repartition(3, hash_by="ticker")
# NOTE(review): "{0}" looks like a placeholder for the first DataFrame passed
# after the query string (here `df`) -- confirm against the partial_sql docs.
df = sp.partial_sql(
    "SELECT ticker, min(price), max(price) FROM {0} GROUP BY ticker",
    df,
)

# Save results
df.write_parquet("output/")

# Show results
print(df.to_pandas())
Smallpond
Creator: Seonglae Cho
Created: 2025 Mar 6 23:09
Editor: Seonglae Cho
Edited: 2025 Mar 6 23:10
Refs: