Cerulean Pond: create very light and simple data lakes.
Install for Python:
pip install cerulean-pond
# Example usage of the Data_Pond class from the cerulean_pond package.
from cerulean_pond import Data_Pond
# Create a Data_Pond instance; every call below goes through this object.
dp = Data_Pond()
# Authenticate before making the other calls. The two string arguments are
# presumably placeholders for a real username and password (in that order) --
# replace them, and avoid hard-coding real credentials in source.
dp.authenticate("username", "password")
# List projects and keep the result in `projects`
# (return type is not shown here -- check the library documentation).
projects = dp.list_projects()
# List files and keep the result in `files`. Called without arguments here;
# NOTE(review): whether this covers all projects or only a default one is not
# visible from this example -- confirm.
files = dp.list_files()
# Upload a file: first argument is the path of the file to upload, second is
# presumably the name of the target project.
dp.upload_file("/path/to/file.csv", "ProjectName")
# Load a file (by file name, then project name) into a DataFrame
# (presumably a pandas DataFrame -- confirm against the library docs).
df = dp.load_file_to_dataframe("file.csv", "ProjectName")
# Load a parquet file into a DataFrame, this time passing the file name and
# project as keyword arguments (`file_name`, `project`).
loaded_df = dp.load_parquet_to_dataframe(file_name="file.parquet", project="ProjectName")
# Upload the DataFrame `df` loaded above as a parquet file to the given
# project; `custom_filename` presumably sets the name it is stored under.
dp.upload_parquet(df, project="ProjectName", custom_filename="file.parquet")