Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
15 changes: 15 additions & 0 deletions .github/workflows/test.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,15 @@
# CI workflow: runs the test suite on pushes to master and on newly opened or updated pull requests.
name: Test
on:
  push:
    branches:
      - master
  pull_request:
    types: [opened, synchronize]

jobs:
  test:
    # NOTE(review): the ubuntu-20.04 hosted runner image has been retired by GitHub;
    # confirm and switch to a supported label (e.g. ubuntu-22.04) if jobs no longer start.
    runs-on: ubuntu-20.04

    steps:
      # The runner workspace starts empty; without a checkout `make test`
      # cannot find the Makefile or the tests/ directory.
      - name: Check out repository
        uses: actions/checkout@v4

      # NOTE(review): nothing here installs pytest or the project's dependencies;
      # confirm they are available on the runner or add an install step before this one.
      - name: Run tests
        run: make test
2 changes: 2 additions & 0 deletions Makefile
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
# Run the test suite with pytest.
# `test` does not produce a file, so it is declared phony to make it run unconditionally.
# The recipe line must begin with a tab character.
.PHONY: test
test:
	pytest tests
Empty file added notebooks/__init__.py
Empty file.
134 changes: 85 additions & 49 deletions notebooks/tutorial.ipynb
Original file line number Diff line number Diff line change
Expand Up @@ -32,16 +32,17 @@
"outputs": [],
"source": [
"char_aug = CharAug(\n",
" unit_prob=0.3, # Процент фразы к которой будут применены аугментации\n",
" min_aug=1, # Минимальное количество аугментаций\n",
" max_aug=5, # Максимальное количество аугментаций\n",
" mult_num=3, # Максимальное количество повторений символов (только для метода multiply)\n",
" unit_prob=0.3,\n",
" min_aug=1,\n",
" max_aug=5,\n",
" mult_num=3,\n",
" random_seed=42,\n",
" lang=\"eng\",\n",
" lang=\"rus\",\n",
" platform=\"pc\",\n",
" )\n",
"\n",
"text = \"Screw you guys, I am going home. (c)\""
"# text = \"Screw you guys, I am going home. (c)\"\n",
"text = \"Привет, как дела?\""
]
},
{
Expand All @@ -56,7 +57,7 @@
{
"data": {
"text/plain": [
"'Scorew yotu guys,u hI kam going home. (c)'"
"'Пнривыеут, как ждела?с'"
]
},
"execution_count": 3,
Expand Down Expand Up @@ -102,7 +103,7 @@
{
"data": {
"text/plain": [
"'Screw YoU guys, I am going Home. (C)'"
"'ПРивЕт, каК дела?'"
]
},
"execution_count": 5,
Expand All @@ -127,7 +128,7 @@
{
"data": {
"text/plain": [
"'Sedew you guya, I am going home. (c)'"
"'Пёевет, как дида?'"
]
},
"execution_count": 6,
Expand All @@ -152,7 +153,7 @@
{
"data": {
"text/plain": [
"'Sxrew you gugs, I am going home. (x)'"
"'Привет, евк дела?'"
]
},
"execution_count": 7,
Expand All @@ -173,7 +174,7 @@
{
"data": {
"text/plain": [
"'crew you guys Iam goinghme. (c)'"
"'Приеткк дла?'"
]
},
"execution_count": 8,
Expand All @@ -194,7 +195,7 @@
{
"data": {
"text/plain": [
"'Screw you ughuys, I vam gcoing hxome. (c)'"
"'Пцриувет, кбак дьелба?'"
]
},
"execution_count": 9,
Expand All @@ -215,7 +216,7 @@
{
"data": {
"text/plain": [
"'Screw yyou guyss, I am ggoinng home. (c)'"
"'Приивеет, какк дела?'"
]
},
"execution_count": 10,
Expand All @@ -236,7 +237,7 @@
{
"data": {
"text/plain": [
"'Srcewy ou guys,I am oging hmoe. (c)'"
"'рПвие,т кка длеа?'"
]
},
"execution_count": 11,
Expand All @@ -257,16 +258,16 @@
{
"data": {
"text/plain": [
"['Screw you guyss, I am going home. (c)',\n",
" 'Screw eou guys, I em goifg home. (c)',\n",
"['Scre you guy, Iam gng home. (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw you yuys, I am goibg hone. (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw youg uys, Iam igong hmoe. (c)',\n",
" 'ScRew You guys6 I Am going home. (c)',\n",
" 'Screwyu guys, I am goig hoe. ()',\n",
" 'Screw you buys, I am go9mg ho,e. (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Srcwe you gyus, Ia m giong home. (c)',\n",
" 'Screw you guys, I am going home. (c)']"
" 'Screw you guys, I am going home. (c)',\n",
" 'ScreW you guYs, I Am goIng home. (c0']"
]
},
"execution_count": 12,
Expand All @@ -280,6 +281,40 @@
"char_aug.aug_batch(text_list, batch_prob=0.5)"
]
},
{
"cell_type": "code",
"execution_count": 32,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"['Привет, как дела?',\n",
" 'Питвет, как днда?',\n",
" 'Пииват, ка5 дела?',\n",
" 'Привет, как дела?',\n",
" 'Привет, как дела?']"
]
},
"execution_count": 32,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"text = \"Привет, как дела?\"\n",
"char_aug.aug_batch(\n",
" batch=[text] * 5,\n",
" batch_prob=0.5,\n",
" action=\"typo\"\n",
" )"
]
},
{
"cell_type": "code",
"execution_count": 13,
Expand All @@ -289,15 +324,15 @@
"data": {
"text/plain": [
"['Screw you guys, I am going home. (c)',\n",
" 'Screw youu guys, II am goingg home. (c)',\n",
" 'Scrreew you guys, I am going home. (c)',\n",
" 'Screww you guys, I am going home. (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw you guyss, I am goingg home. (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw you guys, II am going home. (c)',\n",
" 'Screw you guys, II am going hhome. (c))',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Scrrew you guys, I am goingg home. (c)',\n",
" 'Screw you guys, I am going home. (c)']"
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw you guys, I am goinng home. (c)']"
]
},
"execution_count": 13,
Expand Down Expand Up @@ -335,15 +370,16 @@
"outputs": [],
"source": [
"word_aug = WordAug(\n",
" unit_prob=0.4, # Процент фразы к которой будут применены аугментации\n",
" min_aug=1, # Минимальное количество аугментаций\n",
" max_aug=5, # Максимальное количество аугментаций\n",
" unit_prob=0.4,\n",
" min_aug=1,\n",
" max_aug=5,\n",
" random_seed=42,\n",
" lang=\"eng\",\n",
" lang=\"rus\",\n",
" platform=\"pc\",\n",
" )\n",
"\n",
"text = \"Screw you guys, I am going home. (c)\""
"# text = \"Screw you guys, I am going home. (c)\"\n",
"text = \"Привет, как дела?\""
]
},
{
Expand All @@ -354,7 +390,7 @@
{
"data": {
"text/plain": [
"'S c r e w y o u guys, I am g o i n g home. (c)'"
"'Привет, как д е л а ?'"
]
},
"execution_count": 16,
Expand Down Expand Up @@ -403,7 +439,7 @@
{
"data": {
"text/plain": [
"'Screw to guys, I to going com. (c)'"
"'пркет, как дела?'"
]
},
"execution_count": 18,
Expand All @@ -424,7 +460,7 @@
{
"data": {
"text/plain": [
"'you I am home. (c)'"
"'как дела?'"
]
},
"execution_count": 19,
Expand All @@ -445,7 +481,7 @@
{
"data": {
"text/plain": [
"'Screw I guys, am home. going you (c)'"
"'дела? как Привет,'"
]
},
"execution_count": 20,
Expand All @@ -466,7 +502,7 @@
{
"data": {
"text/plain": [
"'like Screw you guys, I am going completely home. by the way (c)'"
"'Привет, скажем как дела?'"
]
},
"execution_count": 21,
Expand All @@ -487,7 +523,7 @@
{
"data": {
"text/plain": [
"'Screw You guys, i Am going home. (c)'"
"'привет, как дела?'"
]
},
"execution_count": 22,
Expand All @@ -508,7 +544,7 @@
{
"data": {
"text/plain": [
"'Screw you guys, I am going home. (c)'"
"'👉, как дела?'"
]
},
"execution_count": 23,
Expand All @@ -529,7 +565,7 @@
{
"data": {
"text/plain": [
"'Screw y o u guys, I am going h o m e . (c)'"
"'П р и в е т , как дела?'"
]
},
"execution_count": 24,
Expand All @@ -550,7 +586,7 @@
{
"data": {
"text/plain": [
"'Scren you guys, I am going home. (c)'"
"'Привет, как дела?'"
]
},
"execution_count": 25,
Expand All @@ -572,15 +608,15 @@
"data": {
"text/plain": [
"['Screw you guys, I am going home. (c)',\n",
" 'I am guys, Screw you going (c) home.',\n",
" 'Screw you am going (c)',\n",
" 'S c r e w you guys, I am going h o m e . ( c )',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw guys, am going (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw you gugs, I am going hsme. (c)',\n",
" 'Scerw you guys, I am going home. (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'completely Screw you guys, I literally am going you know home. (c)']"
" 'Screw am I you guys, going home. (c)',\n",
" 'Screw you guys, I am going home. (c)']"
]
},
"execution_count": 26,
Expand All @@ -602,15 +638,15 @@
"data": {
"text/plain": [
"['Screw you guys, I am going home. (c)',\n",
" 'screwed your guys, I am long home. (c)',\n",
" 'Screw you guys, I am going home. c',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw you boys, im am going hoem. (c)',\n",
" 'Screw yo guy, to am going home. (c)',\n",
" 'Screw do guys, I i guig home. (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw so guys, I am going homes. wo']"
" 'Screw you guys, I am going home. (c)',\n",
" 'Screw you guys, I am going home. (c)']"
]
},
"execution_count": 27,
Expand Down
Empty file added tests/__init__.py
Empty file.
Loading