Spaces:
Runtime error
Runtime error
Support CSV files and single-label scenarios
Browse files
app.py
CHANGED
@@ -45,7 +45,10 @@ def draw_interactive_scatter_plot(
|
|
45 |
# Normalize values to range between 0-255, to assign a color for each value
|
46 |
max_value = values.max()
|
47 |
min_value = values.min()
|
48 |
-
|
|
|
|
|
|
|
49 |
values_color_set = sorted(values_color)
|
50 |
|
51 |
values_list = values.astype(str).tolist()
|
@@ -59,9 +62,12 @@ def draw_interactive_scatter_plot(
|
|
59 |
return p
|
60 |
|
61 |
|
62 |
-
def generate_plot(
|
63 |
logger.info("Loading dataset in memory")
|
64 |
-
|
|
|
|
|
|
|
65 |
if label_column not in df.columns:
|
66 |
df[label_column] = 0
|
67 |
df = df.dropna(subset=[text_column, label_column])
|
|
|
45 |
# Normalize values to range between 0-255, to assign a color for each value
|
46 |
max_value = values.max()
|
47 |
min_value = values.min()
|
48 |
+
if max_value - min_value == 0:
|
49 |
+
values_color = np.ones(len(values))
|
50 |
+
else:
|
51 |
+
values_color = ((values - min_value) / (max_value - min_value) * 255).round().astype(int).astype(str)
|
52 |
values_color_set = sorted(values_color)
|
53 |
|
54 |
values_list = values.astype(str).tolist()
|
|
|
62 |
return p
|
63 |
|
64 |
|
65 |
+
def generate_plot(uploaded_file: st.uploaded_file_manager.UploadedFile, text_column: str, label_column: str, sample: Optional[int], model: SentenceTransformer):
|
66 |
logger.info("Loading dataset in memory")
|
67 |
+
extension = uploaded_file.name.split(".")[-1]
|
68 |
+
df = pd.read_csv(uploaded_file, sep="\t" if extension == "tsv" else ",")
|
69 |
+
if text_column not in df.columns:
|
70 |
+
raise ValueError("The specified column name doesn't exist")
|
71 |
if label_column not in df.columns:
|
72 |
df[label_column] = 0
|
73 |
df = df.dropna(subset=[text_column, label_column])
|