Petr Tsvetkov
committed on
Commit
·
2f5bdc0
1
Parent(s):
64ddd9b
Save each flagged sample to a separate directory to avoid overly large CSV fields; decrease the keylogger record size
Browse files
app.py
CHANGED
@@ -17,7 +17,7 @@ data = load_data()
|
|
17 |
|
18 |
n_samples = len(data)
|
19 |
|
20 |
-
saver = get_dataset_saver(HF_TOKEN, HF_DATASET, private=True)
|
21 |
|
22 |
|
23 |
def convert_diff_to_unified(diff_string):
|
@@ -53,7 +53,7 @@ def get_github_link_md(repo, hash):
|
|
53 |
|
54 |
|
55 |
def char_diff_obj(change_type, pos, character, timestamp):
|
56 |
-
return {"
|
57 |
|
58 |
|
59 |
def update_commit_view(sample_ind):
|
|
|
17 |
|
18 |
n_samples = len(data)
|
19 |
|
20 |
+
saver = get_dataset_saver(HF_TOKEN, HF_DATASET, private=True, separate_dirs=True)
|
21 |
|
22 |
|
23 |
def convert_diff_to_unified(diff_string):
|
|
|
53 |
|
54 |
|
55 |
def char_diff_obj(change_type, pos, character, timestamp):
|
56 |
+
return {"t": change_type, "p": pos, "c": character, "ts": timestamp}
|
57 |
|
58 |
|
59 |
def update_commit_view(sample_ind):
|