import pandas as pd
import gradio as gr
from datasets import load_dataset
# Larger datasets tried earlier:
# dataset = load_dataset("laion/laion2B-en-joined")  # too big; the Space was evicted
# dataset = load_dataset("laion/laion-coco")  # smaller, but the Space was evicted again
# dataset = load_dataset("laion/laion400m")  # smaller still
# laion-art is roughly 1.2 GB of parquet.
# Request the "train" split explicitly: without `split`, load_dataset returns a
# DatasetDict (split name -> Dataset), which has no `.features` attribute and
# does not convert into a one-row-per-example DataFrame.
dataset = load_dataset("laion/laion-art", split="train")
print(dataset.features)
print(type(dataset))
# Materialise the split as a pandas DataFrame so the paging helpers below can
# use .head() / .loc on it.
df = dataset.to_pandas()
# Earlier CSV-based variant, kept for reference:
# df = pd.read_csv("images.csv")
# df['url'] = df['URL'].apply(lambda x: ' ')
# df = df[[ 'URL', 'TEXT']]
def display_df():
    """Return the first 100 rows of the module-level ``df``."""
    return df.head(100)
def display_next100(dataframe, end, page_size=100, source=None):
    """Return the page of rows that follows the one currently displayed.

    Args:
        dataframe: The page currently shown. Only consulted when ``end`` is
            falsy, in which case its last index label marks the last row
            already displayed. May be ``None`` or empty.
        end: Index label of the last row shown so far. ``None`` and ``0`` are
            both treated as "not set" (same as the original ``end or ...``).
        page_size: Number of index labels per page (default 100).
        source: Table to page through; defaults to the module-level ``df``.

    Returns:
        A ``(rows, end)`` tuple: the slice ``source.loc[start:end]`` and the
        new ``end`` label (an ``int``) to pass to the next call.
    """
    table = df if source is None else source

    # The previous version shuffled ``dataframe`` before reading its last
    # index label. The shuffled copy was never returned, so the only effect
    # was a random starting row whenever ``end`` was unset. Read the last
    # label of the page as given instead.
    if end:
        last_shown = end
    elif dataframe is not None and len(dataframe.index):
        last_shown = dataframe.index[-1]
    else:
        # Nothing displayed yet: start from the first row instead of raising
        # IndexError on an empty index.
        last_shown = -1

    # ``end`` may arrive as a float (e.g. 199.0); normalise to int so the
    # labels used for slicing are integers.
    start = int(last_shown) + 1
    end = start + page_size - 1

    # .loc slices by label and includes both endpoints, so this yields up to
    # ``page_size`` rows. Assumes ``table`` has sorted integer index labels
    # (such as a default RangeIndex) -- confirm if the index is ever changed.
    return table.loc[start:end], end
with gr.Blocks() as demo:
gr.Markdown("