@@ -13,7 +13,7 @@ def common():
13
13
"sorry" : [{"stem" :"(meg)?bocs(i(ka)?|esz|[aá](nat([aá][eé]rt)?|nat[aáo]t?|s+|s+on|j?t(ana)?))?" ,"wordclass" :"regex" },{"stem" :"elnézés" ,"wordclass" :"noun" ,"match_stem" :False },{"stem" :"sajn[aá]l(om|juk)" ,"wordclass" :"regex" },{"stem" :"s+z*o*r+[iy]+(ka)?" ,"wordclass" :"regex" }],
14
14
"lol" : [{"stem" :"(h[aei]){2,}h?" ,"wordclass" :"regex" },{"stem" :"o?(lol)+o?" ,"wordclass" :"regex" },{"stem" :"[\:\;]\-*[dp\)9]+" ,"wordclass" :"regex" ,"boundary" :False },{"stem" :"[\(8]+\-*[:;]" ,"wordclass" :"regex" ,"boundary" :False },{"stem" :"rot?fl" ,"wordclass" :"regex" },{"stem" :"vicces" ,"exc" :[{"stem" :"nem" }]},{"stem" :"nevet(tem|ek|[uü]nk)" ,"wordclass" :"regex" ,"exc" :[{"stem" :"nem" }]}],
15
15
"nvm" : [{"stem" :"felejts[ed]n?\sel" ,"wordclass" :"regex" },{"stem" :"mindegy" ,"exc" :[{"stem" :"hogy" },{"stem" :"nem" }]},{"stem" :"nem fontos" },{"stem" :"hagy(jad?|d)" ,"wordclass" :"regex" ,"inc" :[{"stem" :"jól" ,"affix" :["van" ]},{"stem" :"á" },{"stem" :"mindegy" },{"stem" :"inkább" }]},{"stem" :"ne\s(is\s)?(foglalkoz+(on|[aá]l)?|t[oö]r[oöő]dj([oö]n|[eé]l)?)\s(vel(e|[uü]k)|[ae][vz]+[ae]l)" ,"wordclass" :"regex" },{"stem" :"hagy\w+\sfigyelmen\sk[ií]v[uü]l" ,"wordclass" :"regex" ,"exc" :[{"stem" :"ne" }]},{"stem" :"nem baj" ,"max_words" :2 }],
16
- "help" : [{"stem" :"segít" ,"wordclass" :"verb" ,"prefix" :[],"exc" :[{"stem" :"nem" }]},{"stem" :"segítség" ,"wordclass" :"noun" ,"exc" :[{"stem" :"nem" }]},{"stem" :"help" ,"wordclass" :"verb" ,"prefix" :[],"exc" :[{"stem" :"nem" }]}],
16
+ "help" : [{"stem" :"segít" ,"wordclass" :"verb" ,"prefix" :[],"exc" :[{"stem" :"nem" },{ "stem" : "miben" } ]},{"stem" :"segítség" ,"wordclass" :"noun" ,"exc" :[{"stem" :"nem" }]},{"stem" :"help" ,"wordclass" :"verb" ,"prefix" :[],"exc" :[{"stem" :"nem" }]}],
17
17
"again" : [{"stem" :"[uú]j(ra|b[oó]l|at)|(meg)?ism[eé]t(l[eé]s|el(je|ni)?d?)?|m[eé]g\s?eg+y(szer|et)|megint?" ,"wordclass" :"regex" ,"exc" :[{"stem" :"vagyok" },{"stem" :"ne" ,"affix" :["m" ]}]}],
18
18
"command" : [{"stem" :"(csin[aá]l(jad?|d)|(keres|mutas|mond)[aedjos]+n?|n[eé]z[nz]?[eé]?[dl]|akaro[km]|utas[ií]t\w{1,})" ,"wordclass" :"regex" },{"stem" :"haj[cts]+(a|[aá]?[ld])\sv[eé]gre" ,"wordclass" :"regex" }],
19
19
"question" : [{"stem" :"(\?+$)|(\?+\s\w+)" ,"wordclass" :"regex" },{"stem" :"([^,][^,\S+]hogy|^hogy)(an)?" ,"wordclass" :"regex" },{"stem" :"hol" },{"stem" :"honnan" },{"stem" :"hová" },{"stem" :"hány" ,"affix" :["an" ,"at" ,"ból" ]},{"stem" :"mettől" },{"stem" :"meddig" },{"stem" :"merre" },{"stem" :"mennyi" ,"affix" :["en" ,"re" ]},{"stem" :"mi" ,"affix" :["t" ,"k" ,"ket" ,"kor" ,"korra" ,"lyen" ,"lyenek" ,"nek" ,"től" ,"kortól" ,"korra" ,"ből" ,"hez" ,"re" ,"vel" ]},{"stem" :"ki(k?(e?t|nek|[bt][oöő]l|hez|re|[kv]el)|\saz?)" ,"wordclass" :"regex" ,"exc" :[{"stem" :"\w+[ad]\ski" ,"wordclass" :"regex" }]}],
@@ -121,14 +121,14 @@ def smalltalk():
121
121
"how_are_you" : [{"stem" :"hogy vagy" },{"stem" :"j[oó](l|b+an)\svagy" ,"wordclass" :"regex" },{"stem" :"(j[oó]l|hogy)\s[eé]rzed\s(most\s)?magad(at)?" ,"wordclass" :"regex" },{"stem" :"mizu" ,"affix" :["js" ,"jság" ]},{"stem" :"hogy ityeg" },{"stem" :"(hogy\stelt\sa|milyen(\svolt\sa)?)\snapod(\svan)?" ,"wordclass" :"regex" },{"stem" :"[vw]+h*[aá]+[csz]+[aáu]+p+" ,"wordclass" :"regex" },{"stem" :"(j[oó]|milyen)\s(a\s)?kedved(\svan)?" ,"wordclass" :"regex" },{"stem" :"mi\sa(z\s[aá]bra|\sst[aá]jsz)" ,"wordclass" :"regex" },{"stem" :"hogy\s[eé]rz(i|ed)\smag[aá][dt]" ,"wordclass" :"regex" },{"stem" :"mi a" ,"inc" :[{"stem" :"helyzet" },{"stem" :"stájsz" }]},{"stem" :"mit csinálsz" ,"max_words" :3 },{"stem" :"mi a stájsz" },{"stem" :"hogy ityeg" }],
122
122
"about_name" : [{"stem" :"(mond*(ja)?\ski|mi\sa)\s(bece)nev[eé][dt](et)?" ,"wordclass" :"regex" },{"stem" :"(hogy(an)?|minek)\s(is\s)?(h[ií]v([jn][aá](la)?k|hatom)|nevez+(nek|elek))" ,"wordclass" :"regex" ,"exc" :[{"stem" :"engem" },{"stem" :"én" }]},{"stem" :"(mi?[eé]rt\s|hogy[\s\-]?hogy\s)(let+\s)?(pont\s)?(ezt?\s(let+\s)?(a\s)?|[ií]gy\s|ilyen\s)(nevez[nt]ek|h[ií]v[nt]ak|neved|nevet\s(kapt[aá][dl]|adt[aá]k))" ,"wordclass" :"regex" },{"stem" :"mi\sa\s(bece)?neved?" ,"wordclass" :"regex" ,"exc" :[{"stem" :"az|[ae]n+[ae]k|amiben?|amelyik\w*" ,"wordclass" :"regex" },{"stem" :"engem" },{"stem" :"én" }]},{"stem" :"n[eé]v(ed)?\seredete" ,"wordclass" :"regex" }],
123
123
"about_you" : [{"stem" :"(mes[eé]lj|besz[eé]lj|mondj)([eo]n)?.+?mag(ad|[aá])r[oó]l" ,"wordclass" :"regex" },{"stem" :"mutatkoz+([aá]l|on)?\s+be" ,"wordclass" :"regex" },{"stem" :"(be)?muta(koz(hat)?n[aá]l|(tn[aá]d|sd)\s.+?magad(at)?)" ,"wordclass" :"regex" },{"stem" :"([km]i(\s|\sa\s.+?)vagy te|te [km]i(\s|\sa\s.+?)vagy)" ,"wordclass" :"regex" }],
124
- "about_creator" : [{"stem" :"(ki|hogy(an)?)\s(a\s)?(k[eé]sz([ií]t([oöő]d|et+(ek)?)|[uü]lt([eé]l)?)|gazd[aá]d|programoz([oó]d|ot+|tak)|[ií]rt[aá]k?|(hoz(ot+|tak)|j[oö]t+[eé]l).+?(l[eé]tre|vil[aá]gra|k[oó]dod(at)?)|alkot([oó][dt]+|tak)|teremt(et+|[oöő]d)|(keresztelt|nevezet+|adtak)\sel|adot+\s(neked\s)?nevet)" ,"wordclass" :"regex" }],
124
+ "about_creator" : [{"stem" :"(ki|hogy(an)?)\s(a\s)?(k[eé]sz([ií]t([oöő]d|et+(ek)?)|[uü]lt([eé]l)?)|gazd[aá]d|programoz([oó]d|ot+|tak)|[ií]rt[aá]k?|(hoz(ot+|tak)|j[oö]t+[eé]l).+?(l[eé]tre|vil[aá]gra|k[oó]dod(at)?)|alkot([oó][dt]+|tak)|teremt(et+|[oöő]d)|(keresztelt|nevezet+|adtak)\sel|adot+\s(neked\s)?nevet)" ,"wordclass" :"regex" },{ "stem" : "kik?\s(k[eé]sz[ií]tet+|fejlesztet+)(ek)?" , "wordclass" : "regex" , "max_words" : 3 } ],
125
125
"about_look" : [{"stem" :"hogy(an)?\s(n[eé]zn?[eé]l\ski|mutatsz|festesz)" ,"wordclass" :"regex" },{"stem" :"(k[uü]ldj|mutas+).+?(k[eé]pet|fot[oó]t|sz?elfie?t)\smagadr[oó]l" ,"wordclass" :"regex" },{"stem" :"(k[uü]ldj|mutas+)\smagadr[oó]l.+?(k[eé]pet|fot[oó]t|sz?elfie?t)" ,"wordclass" :"regex" },{"stem" :"(van|milyen)\s(az?\s)?(arcod|kin[eé]zeted)" ,"wordclass" :"regex" },{"stem" :"szép vagy" }],
126
126
"about_age" : [{"stem" :"mennyi idős vagy" },{"stem" :"hány éves vagy" },{"stem" :"melyik évben születtél" },{"stem" :"mikor születtél" },{"stem" :"(melyik\s[eé]vben|mikor)\sk[eé]sz([uü]lt[eé]l|[ií]tet+ek)" ,"wordclass" :"regex" },{"stem" :"(h[aá]ny(adik|ban)|mikor\s(van|[uü]n+epled)\s?a?)\ssz[uü]l(et[eé]s|i)napod(at)?" ,"wordclass" :"regex" },{"stem" :"h[aá]ny\s[eé]vesnek\s.+?\smagad(at)?" ,"wordclass" :"regex" },{"stem" :"sz[uü]l(et[eé]s)?i?napod(at)?\s(h[aá]nyadik[aá]n|mikor|melyik)" ,"wordclass" :"regex" }],
127
127
"about_zodiac" : [{"stem" :"(neked\s)?mi\sa\s(horoszk[oó]pod|csil+agjegyed)" ,"wordclass" :"regex" },{"stem" :"milyen jegyben születtél" },{"stem" :"a\s(te\s)?(horoszk[oó]pod|csil+agjegyed)\smi(csoda)?" ,"wordclass" :"regex" },{"stem" :"milyen\sjegyben\ssz[uü]let+\w+" ,"wordclass" :"regex" }],
128
128
"about_location" : [{"stem" :"(hol|helyen)\s(k[eé]sz[uü]lt[eé]l|k[eé]sz[ií]tet+ek|sz[uü]let+[eé]l|(hoztak|j[oö]t+[eé]l).+?l[eé]tre)" ,"wordclass" :"regex" },{"stem" :"hon+an\s(sz[aá]rmazol|[ií]rsz|val[oó]\svagy)" ,"wordclass" :"regex" },{"stem" :"ho(n+an|l)\svagy\s(most\s)?(helyileg|most|pontosan)" ,"wordclass" :"regex" },{"stem" :"(hol\s|mer+e\s)(laksz|(van|az?).+?ot+honod)" ,"wordclass" :"regex" },{"stem" :"hol vagy" ,"max_words" :3 }],
129
129
"about_family" : [{"stem" :"ki(k|t|ket)?\s(az?\s|tartasz\sa\s)?(te\s)?(csal[aá]dod(nak)?|sz[uü]l(t|et+[eé]l)|sz[uü]leid(nek)?|([eé]des)?(any(uk)?[aá]d|ap(uk)?[aá]d)(nak)?)" ,"wordclass" :"regex" },{"stem" :"csal[aá]dban\s([eé]l(sz|tek)|sz[uü]let+[eé]l)" ,"wordclass" :"regex" },{"stem" :"(h[aá]ny|van(nak)?)\stestv[eé]rei?d" ,"wordclass" :"regex" },{"stem" :"(kik?|van(n?ak)?[\-\s]?e?)(\sa)?(\shoz+[aá]d?\s?tartoz[oó]i?d|csal[aá]dod)" ,"wordclass" :"regex" }],
130
130
"about_software" : [{"stem" :"(hogy(hogy|an)?|mit[oöő]l).+?(m[uüű]k[oö]dsz|(tudsz |vagy k[eé]pes )?(meg)?[eé]rte(sz|d|ni)\,? (meg )?(hogy )?(a?mit mond(ok|tam)|a?mit [ií]r(ok|tam)|engem))" ,"wordclass" :"regex" },{"stem" :"mi(jen|lyen|en|\s?f[eé]le|\s?fajta)\sfekete\s?m[aá]gia" ,"wordclass" :"regex" },{"stem" :"neur[aá]lis\sh[aá]l[oó]\w*" ,"wordclass" :"regex" ,"inc" :[{"stem" :"vagy" },{"stem" :"te" },{"stem" :"működ" ,"wordclass" :"verb" }]}],
131
- "about_skills" : [{"stem" :"mi(lyen|(ke)?t|k?re)\s(funkci[oó](id?|kat)\s|dolgok(at|ra)\s|tr[uü]k+([oö]k(et|re)|jeid?)\s|parancsok(at|ra)\s)?(tud(sz|n[aá]l)?\s(csin[aá]lni|mutatni)?|ismer(sz)?|(vagy\s|van\s)?(k[eé]pes|(be|meg)?tan[ií]tva)|tan[ií]tot+[aá]k\s(be|neked|meg)?|(k[eé]pes+[eé]gei?d?|tulajdons[aá]g(o|ai)d?)\svan(nak)?)" ,"wordclass" :"regex" ,"exc" :[{"stem" :"mond" ,"wordclass" :"verb" }]},{"stem" :"mihez ért" ,"affix" :["esz" ]},{"stem" :"mi((ke)?t|k?r[oöő]l)\s(lehet\s|szabad\s|tudok\s)?k[eé]rdez+h?e\w+" ,"wordclass" :"regex" },{"stem" :"miben tudsz" },{"stem" :"k[eé]rdez+(het)?(ek|ni)\st[oöő]led" ,"wordclass" :"regex" }],
131
+ "about_skills" : [{"stem" :"mi(lyen|(ke)?t|k?re)\s(funkci[oó](id?|kat)\s|dolgok(at|ra)\s|tr[uü]k+([oö]k(et|re)|jeid?)\s|parancsok(at|ra)\s)?(tud(sz|n[aá]l)?\s(csin[aá]lni|mutatni)?|ismer(sz)?|(vagy\s|van\s)?(k[eé]pes|(be|meg)?tan[ií]tva)|tan[ií]tot+[aá]k\s(be|neked|meg)?|(k[eé]pes+[eé]gei?d?|tulajdons[aá]g(o|ai)d?)\svan(nak)?)" ,"wordclass" :"regex" ,"exc" :[{"stem" :"mond" ,"wordclass" :"verb" }]},{"stem" :"mihez ért" ,"affix" :["esz" ]},{"stem" :"mi((ke)?t|k?r[oöő]l)\s(lehet\s|szabad\s|tudok\s)?k[eé]rdez+h?e\w+" ,"wordclass" :"regex" },{"stem" :"miben tudsz" },{"stem" :"k[eé]rdez+(het)?(ek|ni)\st[oöő]led" ,"wordclass" :"regex" },{ "stem" : "mi(ben|vel)\s?tud(sz|n[aá]l)\sseg[ií]teni" , "wordclass" : "regex" } ],
132
132
"about_topics" : [{"stem" :"mir[oöő]l\s.*?besz[eé]lge[st]\w+" ,"wordclass" :"regex" },{"stem" :"milyen\st[eé]m[aá][bk]*r?[aoó][lnt]" ,"wordclass" :"regex" }],
133
133
"about_thoughts" : [{"stem" :"mi(n|re)?\s(gondol(kodsz|ko[dz]ol|sz)|agyalsz|t[oö]prenge?sz|j[aá]r\s(az?\s)?(fejed|agyad)(b[ae]n?)?)" ,"wordclass" :"regex" }],
134
134
"about_favorite" : [{"stem" :"melyik" ,"inc" :[{"stem" :"kedvenc" ,"affix" :["ed" ]},{"stem" :"szeret" ,"affix" :["i" ,"ed" ],"match_stem" :False }]}],
@@ -139,7 +139,7 @@ def smalltalk():
139
139
"are_you_busy" : [{"stem" :"elfoglalt" ,"inc" :[{"stem" :"vagy" }]},{"stem" :"r[aá]m?\s?[eé]r(n[eé]l|sz)(\smost)?(\segy)?(\skicsit|\skis\s\w+|\svalamen+yi\w*)?" ,"wordclass" :"regex" },{"stem" :"(van|volna)\s(most\s)?(r[aá]m?\s)?(most\s)?(egy\s)?(kis\s|kev[eé]s\s|valamen+yi\s)?(szabad\s?)?id[oöő]d(\sr[aá]m)?" ,"wordclass" :"regex" },{"stem" :"sok dolgod van" }],
140
140
"are_you_lying" : [{"stem" :"hazud" ,"wordclass" :"verb" },{"stem" :"nem mondt[aá][dl]\s((el|meg)\saz\s)?igaz(at|s[aá]got)" ,"wordclass" :"regex" }],
141
141
"are_you_serious" : [{"stem" :"(nem?|csak)\s(vic+el(sz|j)?|mond+(od|ja)?|ideges[ií]ts(en)?)" ,"wordclass" :"regex" },{"stem" :"(komolyan|t[eé]nyleg)\s?([uúií]gy\s|azt\s)?((mond|gondol|[ií]r)(ja|od|tad?)|hisz(i|ed)|hit+ed?)" ,"wordclass" :"regex" },{"stem" :"biztos(an)?\s(vagy\s)?(\w+\s)?(ben+e|eb+en|mond(ta|o)d|mond[jt]a)" ,"wordclass" :"regex" },{"stem" :"ezt?\s(most\s)?komoly(an)?" ,"wordclass" :"regex" },{"stem" :"viccelsz" ,"max_words" :1 }],
142
- "can_you_hear_me" : [{"stem" :"(olvas+a|hal+ja|n[eé]zi|van\sit+)(\sezt)?\s(vala|b[aá]r)ki(\sis)?" ,"wordclass" :"regex" },{"stem" :"(hal+(asz|od)|l[aá]t(sz|od)|vesze[ld])\s(engem|a?mit\s(mondok|[ií]rok|k[eé]rdezek))" ,"wordclass" :"regex" },{"stem" :"valaki\s(hal+(ja)?\s|olvas+a|figyeli?(\sar+a)?)\sa?mit\s(ide\s?|it+\s)?([ií]rok|mondok|k[eé]rdezek)" ,"wordclass" :"regex" },{"stem" :"felfogtad" ,"max_words" :3 },{"stem" :"itt" ,"inc" :[{"stem" :"vagy" },{"stem" :"van" }],"max_words" :3 },{"stem" :"halló" ,"max_words" :3 },{"stem" :"hallasz" ,"max_words" :3 },{"stem" :"mikrofon próba" }],
142
+ "can_you_hear_me" : [{"stem" :"(olvas+a|hal+ja|n[eé]zi|van\sit+)(\sezt)?\s(vala|b[aá]r)ki(\sis)?" ,"wordclass" :"regex" },{"stem" :"(hal+(asz|od)|l[aá]t(sz|od)|vesze[ld])\s(engem|a?mit\s(mondok|[ií]rok|k[eé]rdezek))" ,"wordclass" :"regex" },{"stem" :"valaki\s(hal+(ja)?\s|olvas+a|figyeli?(\sar+a)?)\sa?mit\s(ide\s?|it+\s)?([ií]rok|mondok|k[eé]rdezek)" ,"wordclass" :"regex" },{"stem" :"felfogtad" ,"max_words" :3 },{"stem" :"itt" ,"inc" :[{"stem" :"vagy" },{"stem" :"van" }],"max_words" :3 },{"stem" :"halló" ,"max_words" :3 },{"stem" :"hallasz" ,"max_words" :3 },{"stem" :"mikrofon próba" },{ "stem" : "miért nem válaszolsz" } ],
143
143
"can_you_learn" : [{"stem" :"(k[eé]pes(\svagy)?|tud(sz)?)\stanulni" ,"wordclass" :"regex" },{"stem" :"tanulsz\s(is|[ae].+?b[oóöő]l)" ,"wordclass" :"regex" },{"stem" :"[dln][aáeéo][km]\s(be|meg)?tan[ií]tani\b " ,"wordclass" :"regex" ,"boundary" :False },{"stem" :"(lehet|tudlak|tudom)\s(t[eé]ged|[oö]nt)?\stan[ií]tani" ,"wordclass" :"regex" }],
144
144
"can_you_understand_me" :[{"stem" :"(meg)?[eé]rt(e(d|sz|t+ed?)|i)\,?((\shogy)?\sa?mit\s([ií]r|mond)\w+|\smagyarul)" ,"wordclass" :"regex" }],
145
145
"contact" : [{"stem" :"mi(lyen)?\s(.+?\s)?(e\-?mail\s?)?c[ií]me[dn]?" ,"wordclass" :"regex" },{"stem" :"elérhetőség" ,"wordclass" :"noun" },{"stem" :"elér" ,"wordclass" :"verb" ,"inc" :[{"stem" :"önt" },{"stem" :"téged" }]}],
0 commit comments