Spaces:
Running
Running
Quentin Lhoest
commited on
Commit
Β·
bdf93e0
1
Parent(s):
c2de6fa
update tags
Browse files
.gitattributes
CHANGED
|
@@ -26,3 +26,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 26 |
*.zstandard filter=lfs diff=lfs merge=lfs -text
|
| 27 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 28 |
*.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 26 |
*.zstandard filter=lfs diff=lfs merge=lfs -text
|
| 27 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 28 |
*.json filter=lfs diff=lfs merge=lfs -text
|
| 29 |
+
metadata_942418870f35246ce32d98caf3f230024a58428b.json filter=lfs diff=lfs merge=lfs -text
|
metadata_526dba9dce6f983ebcacd65bef35a868a5735df6.json β metadata_942418870f35246ce32d98caf3f230024a58428b.json
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7052da9dcb564799fdfb47ac8f50232fd3022e8d14023d76c280c51eb613e405
|
| 3 |
+
size 30721389
|
requirements.txt
CHANGED
|
@@ -1,4 +1,4 @@
|
|
| 1 |
pyyaml
|
| 2 |
streamlit>=0.88.0
|
| 3 |
langcodes[data]
|
| 4 |
-
datasets
|
|
|
|
| 1 |
pyyaml
|
| 2 |
streamlit>=0.88.0
|
| 3 |
langcodes[data]
|
| 4 |
+
git+https://github.com/huggingface/datasets@7e514c3#egg=datasets
|
tagging_app.py
CHANGED
|
@@ -76,10 +76,10 @@ def multiselect(
|
|
| 76 |
return w.multiselect(markdown, valid_set, default=valid_values, format_func=format_func, key=title)
|
| 77 |
|
| 78 |
|
| 79 |
-
def
|
| 80 |
try:
|
| 81 |
-
DatasetMetadata(
|
| 82 |
-
if not
|
| 83 |
raise ValueError("Please specify a non-empty Dataset name.")
|
| 84 |
w.markdown("β
This is a valid tagset! π€")
|
| 85 |
except Exception as e:
|
|
@@ -168,10 +168,11 @@ if leftbtn.button("pre-load"):
|
|
| 168 |
state = initial_state or new_state()
|
| 169 |
st.experimental_set_query_params(preload_dataset=preloaded_id)
|
| 170 |
if not is_state_empty(state):
|
| 171 |
-
if rightbtn.button("
|
| 172 |
state = new_state()
|
| 173 |
initial_state = None
|
| 174 |
preloaded_id = None
|
|
|
|
| 175 |
st.experimental_set_query_params()
|
| 176 |
|
| 177 |
if preloaded_id is not None and initial_state is not None:
|
|
@@ -181,7 +182,7 @@ if preloaded_id is not None and initial_state is not None:
|
|
| 181 |
The current base tagset is [`{preloaded_id}`](https://huggingface.co/datasets/{preloaded_id})
|
| 182 |
"""
|
| 183 |
)
|
| 184 |
-
|
| 185 |
st.sidebar.markdown(
|
| 186 |
f"""
|
| 187 |
Here is the matching yaml block:
|
|
@@ -382,7 +383,7 @@ rightcol.markdown(
|
|
| 382 |
if is_state_empty(state):
|
| 383 |
rightcol.markdown("β This is an invalid tagset: it's empty!")
|
| 384 |
else:
|
| 385 |
-
|
| 386 |
|
| 387 |
|
| 388 |
rightcol.markdown(
|
|
@@ -400,5 +401,4 @@ This is a standalone tool, it is useful to check for errors on an existing tagse
|
|
| 400 |
|
| 401 |
yamlblock = rightcol.text_area("Input your yaml here")
|
| 402 |
if yamlblock.strip() != "":
|
| 403 |
-
|
| 404 |
-
validate_dict(rightcol, inputdict)
|
|
|
|
| 76 |
return w.multiselect(markdown, valid_set, default=valid_values, format_func=format_func, key=title)
|
| 77 |
|
| 78 |
|
| 79 |
+
def validate_yaml(w: st.delta_generator.DeltaGenerator, yamlblock: str):
|
| 80 |
try:
|
| 81 |
+
DatasetMetadata.from_yaml_string(yamlblock)
|
| 82 |
+
if "pretty_name: " not in yamlblock or "pretty_name: ''" in yamlblock:
|
| 83 |
raise ValueError("Please specify a non-empty Dataset name.")
|
| 84 |
w.markdown("β
This is a valid tagset! π€")
|
| 85 |
except Exception as e:
|
|
|
|
| 168 |
state = initial_state or new_state()
|
| 169 |
st.experimental_set_query_params(preload_dataset=preloaded_id)
|
| 170 |
if not is_state_empty(state):
|
| 171 |
+
if rightbtn.button("reset"):
|
| 172 |
state = new_state()
|
| 173 |
initial_state = None
|
| 174 |
preloaded_id = None
|
| 175 |
+
initial_infos = None
|
| 176 |
st.experimental_set_query_params()
|
| 177 |
|
| 178 |
if preloaded_id is not None and initial_state is not None:
|
|
|
|
| 182 |
The current base tagset is [`{preloaded_id}`](https://huggingface.co/datasets/{preloaded_id})
|
| 183 |
"""
|
| 184 |
)
|
| 185 |
+
validate_yaml(st.sidebar, yaml.dump(initial_state))
|
| 186 |
st.sidebar.markdown(
|
| 187 |
f"""
|
| 188 |
Here is the matching yaml block:
|
|
|
|
| 383 |
if is_state_empty(state):
|
| 384 |
rightcol.markdown("β This is an invalid tagset: it's empty!")
|
| 385 |
else:
|
| 386 |
+
validate_yaml(rightcol, yaml.dump(state))
|
| 387 |
|
| 388 |
|
| 389 |
rightcol.markdown(
|
|
|
|
| 401 |
|
| 402 |
yamlblock = rightcol.text_area("Input your yaml here")
|
| 403 |
if yamlblock.strip() != "":
|
| 404 |
+
validate_yaml(rightcol, yamlblock)
|
|
|