1+ from __future__ import annotations
2+
13import random
2- from typing import Any , Dict , List
4+ from typing import Any
35
46import augmenty
57import catalogue
1517
1618
1719@datasets .register ("dane" )
18- def dane () -> Dict [str , List [Example ]]:
20+ def dane () -> dict [str , list [Example ]]:
1921 from dacy .datasets import dane as _dane
2022
2123 train , dev , test = _dane (splits = ["train" , "dev" , "test" ]) # type: ignore
@@ -34,7 +36,7 @@ def augment_dataset(
3436 augmenters : dict ,
3537 n_rep : int = 20 ,
3638 split : str = "test" ,
37- ) -> List [Example ]:
39+ ) -> list [Example ]:
3840 # ensure seed
3941 random .seed (42 )
4042 np .random .seed (42 )
@@ -63,25 +65,25 @@ def augment_dataset(
6365
6466
6567@datasets .register ("gender_bias_dane" )
66- def dane_gender_bias () -> Dict [str , List [Example ]]:
68+ def dane_gender_bias () -> dict [str , list [Example ]]:
6769 return {"test" : augment_dataset ("dane" , augmenters = get_gender_bias_augmenters ())}
6870
6971
7072@datasets .register ("robustness_dane" )
71- def dane_robustness () -> Dict [str , List [Example ]]:
73+ def dane_robustness () -> dict [str , list [Example ]]:
7274 return {"test" : augment_dataset ("dane" , augmenters = get_robustness_augmenters ())}
7375
7476
7577@datasets .register ("dansk" )
76- def dansk (** kwargs : Any ) -> Dict [str , List [Example ]]:
78+ def dansk (** kwargs : Any ) -> dict [str , list [Example ]]:
7779 splits = ["train" , "dev" , "test" ]
7880
7981 if not Doc .has_extension ("meta" ):
8082 Doc .set_extension ("meta" , default = {}, force = True )
8183
8284 nlp = spacy .blank ("da" )
8385
84- def convert_to_doc (example : Dict ) -> Doc :
86+ def convert_to_doc (example : dict ) -> Doc :
8587 doc = Doc (nlp .vocab ).from_json (example )
8688 # set metadata
8789 for k in ["dagw_source" , "dagw_domain" , "dagw_source_full" ]:
0 commit comments