Datasets:
fold
int32
1
5
| subfold
string
| words
sequence
| segments
sequence
| pos_tags
sequence
|
---|---|---|---|---|
4 | "A" | [
"ููู",
"ูู
ุง",
"ุชุญุจ",
"ุญุฏ",
"ู
ู",
"ููุจู",
"ูุทูุน",
"ูุงุทู",
"ููู",
"ูู
ุง",
"ุชูุนุจ",
"ุนูู",
"ูุงุญุฏ",
"ูุทูุน",
"ุจูุญุจู",
"ููู",
"ุงููู",
"ููู
ูุช",
"ุนููู",
"ุงูุช",
"ู
ุด",
"ุทุงููู",
"ูุงููู",
"ูุชู
ูุช",
"ุนููู",
"ู
ุด",
"ุทุงููู",
"ุนุฌุจุช",
"ูู",
"ูุง",
"ุฒู
ู",
"EOS"
] | [
"ููู",
"ูู
ุง",
"ุชุญุจ",
"ุญุฏ",
"ู
ู",
"ููุจ+ู",
"ูุทูุน",
"ูุงุทู",
"ููู",
"ูู
ุง",
"ุชูุนุจ",
"ุนูู",
"ูุงุญุฏ",
"ูุทูุน",
"ุจ+ูุญุจ+ู",
"ููู",
"ุงููู",
"ู+ูู
ูุช",
"ุนูู+ู",
"ุงูุช",
"ู
ุด",
"ุทุงูู+ู",
"ู+ุงููู",
"ู+ุชู
ูุช",
"ุนูู+ู",
"ู
ุด",
"ุทุงูู+ู",
"ุนุฌุจ+ุช",
"ู+ู",
"ูุง",
"ุฒู
ู",
"EOS"
] | [
"PART",
"PART",
"V",
"NOUN",
"PREP",
"NOUN+PRON",
"V",
"ADJ",
"PART",
"PART",
"V",
"PREP",
"NOUN",
"V",
"PROG_PART+V+PRON",
"PART",
"PART",
"FUT_PART+V",
"PREP+PRON",
"PRON",
"PART",
"ADJ+PRON",
"CONJ+PART",
"FUT_PART+V",
"PREP+PRON",
"PART",
"ADJ+PRON",
"V+PRON",
"PREP+PRON",
"PART",
"NOUN",
"EOS"
] |
4 | "A" | [
"ุนุงุฑู",
"ุจููููู",
"ุงูู",
"\"",
"ุฅุฐุง",
"ุฃุฎุทุฃุช",
"ูุฃุญุณู",
"\"",
".",
".",
"ูุนูู",
"ู
ุชุนูุฏุด",
".",
".",
"ู",
"ู
ุชุณุฃูุด",
"ู
ูู",
"ุงููู",
"ุจููููู",
".",
"EOS"
] | [
"ุนุงุฑู",
"ุจ+ููู+ู+ู",
"ุงูู",
"\"",
"ุฅุฐุง",
"ุฃุฎุทุฃ+ุช",
"ู+ุฃุญุณู",
"\"",
".",
".",
"ูุนูู",
"ู
+ุชุนูุฏ+ุด",
".",
".",
"ู",
"ู
+ุชุณุฃู+ุด",
"ู
ูู",
"ุงููู",
"ุจ+ููู+ู+ู",
".",
"EOS"
] | [
"ADJ",
"PROG_PART+V+PREP+PRON",
"PART",
"PUNC",
"PART",
"V+PRON",
"CONJ+V",
"PUNC",
"PUNC",
"PUNC",
"V",
"PART+V+NEG_PART",
"PUNC",
"PUNC",
"CONJ",
"PART+V+NEG_PART",
"PART",
"PART",
"PROG_PART+V+PREP+PRON",
"PUNC",
"EOS"
] |
3 | "A" | [
"ุงูุญู
ุฏ",
"ููู",
"ูุง",
"ุฌุฏุนุงู",
"ุงููุฑุณุงู",
"ุงููู",
"ุงุชู
ุณููุง",
"ุนูุฏ",
"ุณุชุงุฏ",
"ุงููุงูุฑุฉ",
"ุฎุฏูุง",
"ุงุฎูุงุก",
"ุณุจูู",
"#ุฑุจูุง_ูุจูุฑ",
".",
".",
"ุจูุงููุง",
"7",
"ุณููู",
"ุธูู
",
"ู",
"ููุฑ",
"ุฏู",
"ูุฑุถู",
"ู
ูู",
"ุ",
"ุ",
"ุ",
"ุ",
"#ุงูุญู
ุฏ_ููู",
"EOS"
] | [
"ุงู+ุญู
ุฏ",
"ู+ุงููู",
"ูุง",
"ุฌุฏุนุงู",
"ุงู+ูุฑุณุงู",
"ุงููู",
"ุงุชู
ุณู+ูุง",
"ุนูุฏ",
"ุณุชุงุฏ",
"ุงู+ูุงูุฑ+ุฉ",
"ุฎุฏ+ูุง",
"ุงุฎูุงุก",
"ุณุจูู",
"#ุฑุจูุง_ูุจูุฑ",
".",
".",
"ุจูุง+ู+ูุง",
"7",
"ุณู+ูู",
"ุธูู
",
"ู",
"ููุฑ",
"ุฏู",
"ูุฑุถู",
"ู
ูู",
"ุ",
"ุ",
"ุ",
"ุ",
"#ุงูุญู
ุฏ_ููู",
"EOS"
] | [
"DET+NOUN",
"PREP+NOUN",
"PART",
"NOUN",
"DET+NOUN",
"PART",
"V+PRON",
"NOUN",
"NOUN",
"DET+NOUN+NSUFF",
"V+PRON",
"NOUN",
"NOUN",
"HASH",
"PUNC",
"PUNC",
"V+PREP+PRON",
"NUM",
"NOUN+NSUFF",
"NOUN",
"CONJ",
"NOUN",
"PRON",
"V",
"PART",
"PUNC",
"PUNC",
"PUNC",
"PUNC",
"HASH",
"EOS"
] |
1 | "A" | [
"ุจุญุณ",
"ุจุดุฎุตูุชู",
"ุงููููุฉ",
"ูู
ุง",
"ุงููู",
"ูุงุฎููุง",
"ุงุนู
ู",
"ุญุงุฌุฉ",
".",
".",
"ู",
"ูุนู
ููุง",
".",
".",
"ุญุชู",
"ูู",
"ุฑุฎู
",
"ู",
"ูุงู",
"ูุฃ",
".",
".",
"ุจุญุณ",
"ุงูู",
"ุดุฎุตูุฉ",
"ูุฏุง",
"ู",
"ุจุชุณู
ุน",
"ููุงู
ู",
"^_^",
"EOS"
] | [
"ุจ+ุญุณ",
"ุจ+ุดุฎุตู+ุช+ู",
"ุงู+ููู+ุฉ",
"ูู
ุง",
"ุงููู",
"ู+ุงุฎู+ูุง",
"ุงุนู
ู",
"ุญุงุฌ+ุฉ",
".",
".",
"ู",
"ูุนู
ู+ูุง",
".",
".",
"ุญุชู",
"ูู",
"ุฑุฎู
",
"ู",
"ูุงู",
"ูุฃ",
".",
".",
"ุจ+ุญุณ",
"ุงู+ู",
"ุดุฎุตู+ุฉ",
"ูุฏุง",
"ู",
"ุจ+ุชุณู
ุน",
"ููุงู
+ู",
"^_^",
"EOS"
] | [
"PROG_PART+V",
"PREP+NOUN+NSUFF+PRON",
"DET+ADJ+NSUFF",
"PART",
"V",
"PREP+NOUN+PRON",
"V",
"NOUN+NSUFF",
"PUNC",
"PUNC",
"CONJ",
"V+PRON",
"PUNC",
"PUNC",
"PART",
"PART",
"V",
"CONJ",
"V",
"PART",
"PUNC",
"PUNC",
"PROG_PART+V",
"PART+PRON",
"NOUN+NSUFF",
"ADV",
"CONJ",
"PROG_PART+V",
"NOUN+PRON",
"EMOT",
"EOS"
] |
5 | "A" | [
"@ahmedabodsheesh",
"ูุง",
"ุจุงุดุง",
"ุฏู",
"ู
ุด",
"ู
ุญุชุงุฌู",
"ุฏุฑุงุณู",
"ุฏู",
"ุจุชุจูู",
"ู
ููุจู",
"ุนูุฏู",
"ู
ุซูุง",
"ุนููุงุก",
"ุตุงุฏู",
"ู",
"ุตููุช",
"ุญุฌุงุฒู",
"ุฏูู",
"ุชููููุง",
"ุนูู",
"ุงุณุชุงุฐูู
",
"ุตููุช",
"ุงูุดุฑูู",
"ูุจูุฑูู
",
"EOS"
] | [
"@ahmedabodsheesh",
"ูุง",
"ุจุงุดุง",
"ุฏู",
"ู
ุด",
"ู
ุญุชุงุฌ+ู",
"ุฏุฑุงุณ+ู",
"ุฏู",
"ุจ+ุชุจูู",
"ู
ููุจ+ู",
"ุนูุฏ+ู",
"ู
ุซู+ุง",
"ุนููุงุก",
"ุตุงุฏู",
"ู",
"ุตููุช",
"ุญุฌุงุฒู",
"ุฏูู",
"ุชููู+ูุง",
"ุนูู",
"ุงุณุชุงุฐ+ูู
",
"ุตููุช",
"ุงู+ุดุฑูู",
"ูุจูุฑ+ูู
",
"EOS"
] | [
"MENTION",
"PART",
"NOUN",
"PRON",
"PART",
"ADJ+NSUFF",
"NOUN+NSUFF",
"PRON",
"PROG_PART+V",
"NOUN+NSUFF",
"NOUN+PRON",
"NOUN+CASE",
"NOUN",
"NOUN",
"CONJ",
"NOUN",
"NOUN",
"PRON",
"V+PRON",
"PREP",
"NOUN+PRON",
"NOUN",
"DET+NOUN",
"ADJ+PRON",
"EOS"
] |
2 | "A" | [
"ู",
"ูู",
"ูู",
"ู
ุญุงู
ูู",
"ููุนุจูุฑููุง",
"ุจุนุฏ",
"ุงุนุชูุงู",
"ูุชูุฏูุฏ",
"ุงูู
ุญุงู
ูู",
"ุงููู",
"ุจูุฏุงูุนูุง",
"ุนู",
"ุงูู
ุธููู
ูู",
"ุ",
"ุ",
"ุ",
"ุฏู",
"ุบูุฑ",
"ุงูู
ุญุงู
ู",
"ุงููู",
"ูุชููุง",
"ูุงูุฏุชู",
"!",
"@mohamedwaked",
"@ANohan",
"EOS"
] | [
"ู",
"ูู",
"ูู",
"ู
ุญุงู
+ูู",
"ู+ูุนุจุฑ+ู+ูุง",
"ุจุนุฏ",
"ุงุนุชูุงู",
"ู+ุชูุฏูุฏ",
"ุงู+ู
ุญุงู
+ูู",
"ุงููู",
"ุจ+ูุฏุงูุน+ูุง",
"ุนู",
"ุงู+ู
ุธููู
+ูู",
"ุ",
"ุ",
"ุ",
"ุฏู",
"ุบูุฑ",
"ุงู+ู
ุญุงู
ู",
"ุงููู",
"ูุชู+ูุง",
"ูุงูุฏ+ุช+ู",
"!",
"@mohamedwaked",
"@ANohan",
"EOS"
] | [
"CONJ",
"PRON",
"PREP",
"NOUN+NSUFF",
"FUT_PART+V+PRON+PRON",
"NOUN",
"NOUN",
"CONJ+NOUN",
"DET+NOUN+NSUFF",
"PART",
"PROG_PART+V+PRON",
"PREP",
"DET+NOUN+NSUFF",
"PUNC",
"PUNC",
"PUNC",
"PRON",
"NOUN",
"DET+NOUN",
"PART",
"V+PRON",
"NOUN+NSUFF+PRON",
"PUNC",
"MENTION",
"MENTION",
"EOS"
] |
1 | "A" | [
"ู
ุนุธู
",
"ุงูุญุงุฌุงุช",
"ุงููู",
"ู
ุจููุฏุฑุด",
"ูุญูููุง",
"ุจููุฌู",
"ููุชุจูุง",
"ููุง",
"ุนูู",
"ุงูุฃูู",
"ุจุชุฎูู",
"ุนูุง",
"ุดููุฉ",
".",
"EOS"
] | [
"ู
ุนุธู
",
"ุงู+ุญุงุฌ+ุงุช",
"ุงููู",
"ู
+ุจ+ููุฏุฑ+ุด",
"ูุญูู+ูุง",
"ุจ+ููุฌู",
"ููุชุจ+ูุง",
"ููุง",
"ุนูู",
"ุงู+ุฃูู",
"ุจ+ุชุฎูู",
"ุนู+ุง",
"ุดูู+ุฉ",
".",
"EOS"
] | [
"NOUN",
"DET+NOUN+NSUFF",
"PART",
"PART+PROG_PART+V+NEG_PART",
"V+PRON",
"PROG_PART+V",
"V+PRON",
"ADV",
"PREP",
"DET+ADJ",
"PROG_PART+V",
"PREP+PRON",
"NOUN+NSUFF",
"PUNC",
"EOS"
] |
5 | "A" | [
"ุงุญูุง",
"ุจูุฒุนู",
"ูู
ุง",
"ุฑุจูุง",
"ูุจุชูููุง",
"ุฃู",
"ุชุญุตููุง",
"ุญุงุฌู",
"ูุญุดู",
"!",
"ู
ุน",
"ุงู",
"ุฑุจูุง",
"ุฅุฐุง",
"ุญุจ",
"ุนุจุฏ",
"ุงุจุชูุงู",
"ูุชูููุฑ",
"ุนู",
"ุฐููุจู",
"-",
"ูุนูู",
"ุฎุงู",
"ูู",
"ุฑุจูุง",
"ู
ุด",
"ุงุจุชูุงู",
".",
"EOS"
] | [
"ุงุญูุง",
"ุจ+ูุฒุนู",
"ูู
ุง",
"ุฑุจ+ูุง",
"ูุจุชูู+ูุง",
"ุฃู",
"ุชุญุต+ู+ูุง",
"ุญุงุฌ+ู",
"ูุญุด+ู",
"!",
"ู
ุน",
"ุงู",
"ุฑุจ+ูุง",
"ุฅุฐุง",
"ุญุจ",
"ุนุจุฏ",
"ุงุจุชูุง+ู",
"ู+ุชูููุฑ",
"ุนู",
"ุฐููุจ+ู",
"-",
"ูุนูู",
"ุฎุงู",
"ูู",
"ุฑุจ+ูุง",
"ู
ุด",
"ุงุจุชูุง+ู",
".",
"EOS"
] | [
"PRON",
"PROG_PART+V",
"PART",
"NOUN+PRON",
"V+PRON",
"CONJ",
"V+PREP+PRON",
"NOUN+NSUFF",
"ADJ+NSUFF",
"PUNC",
"NOUN",
"PART",
"NOUN+PRON",
"PART",
"V",
"NOUN",
"V+PRON",
"PREP+NOUN",
"PREP",
"NOUN+PRON",
"PUNC",
"ADV",
"V",
"PART",
"NOUN+PRON",
"PART",
"V+PRON",
"PUNC",
"EOS"
] |
4 | "A" | [
"(",
"6",
")",
"ู
ุด",
"ุนุงุฑู",
"ููู",
"ุจุณ",
"ุงูููู
ุฉ",
"ุงููู",
"ุนู
ุฑู",
"ู
ุง",
"ูุชูุฏู
",
"ุนูููุง",
"ุงูููู
ุฉ",
"ุงููู",
"ุฃูุช",
"ูุณุฉ",
"ู
ูููุชูุงุด",
".",
".",
".",
"ุจุณ",
"ููุฃุณู",
"ูุงุฒู
",
"ูุฌู",
"ุนููู",
"ููุช",
"ู",
"ุชููููุง",
"EOS"
] | [
"(",
"6",
")",
"ู
ุด",
"ุนุงุฑู",
"ููู",
"ุจุณ",
"ุงู+ููู
+ุฉ",
"ุงููู",
"ุนู
ุฑ+ู",
"ู
ุง",
"ู+ุชูุฏู
",
"ุนูู+ูุง",
"ุงู+ููู
+ุฉ",
"ุงููู",
"ุฃูุช",
"ูุณ+ุฉ",
"ู
+ููู+ุช+ูุง+ุด",
".",
".",
".",
"ุจุณ",
"ู+ุงู+ุฃุณู",
"ูุงุฒู
",
"ูุฌู",
"ุนูู+ู",
"ููุช",
"ู",
"ุชููู+ูุง",
"EOS"
] | [
"PUNC",
"NUM",
"PUNC",
"PART",
"ADJ",
"PART",
"ADV",
"DET+NOUN+NSUFF",
"PART",
"NOUN+PRON",
"PART",
"FUT_PART+V",
"PREP+PRON",
"DET+NOUN+NSUFF",
"PART",
"PRON",
"ADV+NSUFF",
"PART+V+PRON+PRON+NEG_PART",
"PUNC",
"PUNC",
"PUNC",
"PART",
"PREP+DET+NOUN",
"ADJ",
"V",
"PREP+PRON",
"NOUN",
"CONJ",
"V+PRON",
"EOS"
] |
3 | "A" | [
"ุงุถุญู",
"ูุจูุงุด",
"ุงูุชูุดูุฑุฉ",
"ุชูุณูู",
"ุดูู",
"ุงูุถุญูุฉ",
"ูุดู",
"ูููุฑู
ุด",
"ุนุงููุงุถู",
"ููุชุนุฌุฒ",
"ุจุฏุฑู",
"ุฎููู",
"ูุงุตุญ",
"ูุงุฑู
ู",
"ูู
ูู
ู",
"ูุฑุง",
"ุถูุฑู",
"ูุงูุฑุญ",
"ุฏู",
"ุงูุงูุงู
",
"ุจุชููุช",
"ูุชุนุฏู",
"ูุงูุนู
ุฑ",
"ุจูุฌุฑู",
"EOS"
] | [
"ุงุถุญู",
"ู+ุจูุงุด",
"ุงู+ุชูุดูุฑ+ุฉ",
"ุชูุณู+ู",
"ุดูู",
"ุงู+ุถุญู+ุฉ",
"ูุด+ู",
"ู+ููุฑู
ุด",
"ุน+ุงู+ูุงุถู",
"ู+ู+ุชุนุฌุฒ",
"ุจุฏุฑู",
"ุฎู+ู+ู",
"ูุงุตุญ",
"ู+ุงุฑู
+ู",
"ูู
ูู
+ู",
"ูุฑุง",
"ุถูุฑ+ู",
"ู+ุงูุฑุญ",
"ุฏู",
"ุงู+ุงูุงู
",
"ุจ+ุชููุช",
"ู+ุชุนุฏู",
"ู+ุงู+ุนู
ุฑ",
"ุจ+ูุฌุฑู",
"EOS"
] | [
"V",
"CONJ+PART",
"DET+NOUN+NSUFF",
"V+PRON",
"NOUN",
"DET+NOUN+NSUFF",
"NOUN+PRON",
"FUT_PART+V",
"PREP+DET+NOUN",
"CONJ+FUT_PART+V",
"ADJ",
"V+PRON+PRON",
"ADJ",
"CONJ+V+PRON",
"NOUN+PRON",
"NOUN",
"NOUN+PRON",
"CONJ+V",
"PRON",
"DET+NOUN",
"PROG_PART+V",
"CONJ+V",
"CONJ+DET+NOUN",
"PROG_PART+V",
"EOS"
] |
3 | "A" | [
"ู
ุด",
"ู
ุนูู",
"ุงู",
"ุญุฏ",
"ุจูุถุญู",
"ูุชูุฑ",
"ูุจูู",
"ุณุนูุฏ",
"ูู
ูู",
"ุจูุถุญู",
"ูุชูุฑ",
"ู
ู",
"ูู
ู",
"ุงููุจูุฑ",
"ุจูุถุญู",
"ุนุดุงู",
"ูุจุนุฏ",
"ุนู",
"ุญุฒูู",
"ููุนู
ู",
"ููุณู",
"ูุงุณูู",
"EOS"
] | [
"ู
ุด",
"ู
ุนูู",
"ุงู",
"ุญุฏ",
"ุจ+ูุถุญู",
"ูุชูุฑ",
"ูุจูู",
"ุณุนูุฏ",
"ูู
ูู",
"ุจ+ูุถุญู",
"ูุชูุฑ",
"ู
ู",
"ูู
+ู",
"ุงู+ูุจูุฑ",
"ุจ+ูุถุญู",
"ุนุดุงู",
"ูุจุนุฏ",
"ุนู",
"ุญุฒู+ู",
"ู+ูุนู
ู",
"ููุณ+ู",
"ูุงุณู+ู",
"EOS"
] | [
"PART",
"NOUN",
"PART",
"NOUN",
"PROG_PART+V",
"ADJ",
"V",
"ADJ",
"V",
"PROG_PART+V",
"ADJ",
"PREP",
"NOUN+PRON",
"DET+ADJ",
"PROG_PART+V",
"PART",
"V",
"PREP",
"NOUN+PRON",
"CONJ+V",
"NOUN+PRON",
"ADJ+PRON",
"EOS"
] |
5 | "A" | [
"ุงูุงูู",
"ููุง",
"ุจุนุฏ",
"ู
ุงุญุฏ",
"ูุงุฎุฏ",
"ุงุฎูุงุก",
"ุณุจูู",
"ุงู",
"ุจุฑุงุกุฉ",
"ูุฏุนู",
"ุงู",
"ุงูููุงุจุฉ",
"ู
ุงุชุณุชุฃููุด",
"ุฏูููุชู",
"ุจูุฏุนู",
"ูู
ุงู",
"ุงู",
"ุงู
ู",
"ุงูุฏููุฉ",
"ู
ุง",
"ูุงุฎุฏูููุด",
"#ุณูุณู_ูุงูุฏ",
"#ุจูุงูุง",
"EOS"
] | [
"ุงู+ุงูู",
"ูู+ุง",
"ุจุนุฏ",
"ู
ุง+ุญุฏ",
"ูุงุฎุฏ",
"ุงุฎูุงุก",
"ุณุจูู",
"ุงู",
"ุจุฑุงุก+ุฉ",
"ูุฏุนู",
"ุงู",
"ุงู+ููุงุจ+ุฉ",
"ู
ุง+ุชุณุชุฃูู+ุด",
"ุฏูููุชู",
"ุจ+ูุฏุนู",
"ูู
ุงู",
"ุงู",
"ุงู
ู",
"ุงู+ุฏูู+ุฉ",
"ู
ุง",
"ูุงุฎุฏ+ู+ูู+ุด",
"#ุณูุณู_ูุงูุฏ",
"#ุจูุงูุง",
"EOS"
] | [
"DET+NUM",
"V+PRON",
"NOUN",
"PART+NOUN",
"V",
"NOUN",
"NOUN",
"CONJ",
"NOUN+NSUFF",
"V",
"PART",
"DET+NOUN+NSUFF",
"PART+V+NEG_PART",
"NOUN",
"PROG_PART+V",
"ADV",
"PART",
"NOUN",
"DET+NOUN+NSUFF",
"PART",
"V+PRON+PRON+NEG_PART",
"HASH",
"HASH",
"EOS"
] |
5 | "A" | [
"ู
ููุด",
"ุงูุญุด",
"ู
ู",
"ุงูู",
"ุชููู",
"ุดุฎุต",
"ู
ุฒุงุฌู",
"ุชูุงุตูู",
"ุตุบูุฑุฉ",
"ู
ู
ูู",
"ุชุฎููู",
"ุทุงูุฑ",
"ู
ู",
"ุงููุฑุญุฉ",
".",
".",
".",
"ูููู
ุฉ",
"ุตุบูุฑุฉ",
"ุจุฑุฏู",
"ุชูุฒูู",
"ูุณุงุจุน",
"ุงุฑุถ",
"ูุชูุฆุจู",
".",
".",
"!",
"EOS"
] | [
"ู
+ูู+ุด",
"ุงูุญุด",
"ู
ู",
"ุงู+ู",
"ุชููู",
"ุดุฎุต",
"ู
ุฒุงุฌู",
"ุชูุงุตูู",
"ุตุบูุฑ+ุฉ",
"ู
ู
ูู",
"ุชุฎู+ู+ู",
"ุทุงูุฑ",
"ู
ู",
"ุงู+ูุฑุญ+ุฉ",
".",
".",
".",
"ู+ููู
+ุฉ",
"ุตุบูุฑ+ุฉ",
"ุจุฑุฏู",
"ุชูุฒู+ู",
"ู+ุณุงุจุน",
"ุงุฑุถ",
"ู+ุชูุฆุจ+ู",
".",
".",
"!",
"EOS"
] | [
"PART+PREP+NEG_PART",
"ADJ",
"PREP",
"PART+PRON",
"V",
"NOUN",
"ADJ",
"NOUN",
"ADJ+NSUFF",
"ADJ",
"V+PRON+PRON",
"ADJ",
"PREP",
"DET+NOUN+NSUFF",
"PUNC",
"PUNC",
"PUNC",
"CONJ+NOUN+NSUFF",
"ADJ+NSUFF",
"ADV",
"V+PRON",
"PREP+NUM",
"NOUN",
"CONJ+V+PRON",
"PUNC",
"PUNC",
"PUNC",
"EOS"
] |
4 | "A" | [
"ุนุงุฑู",
"ุงูุช",
"ุงูุตุญุงุจ",
"ุงูุฌุฏุนุฉ",
"ุฏู",
"ุงููู",
"ุจุชุญุจูู",
"ุงูุฎูุฑ",
"ู",
"ุฏุงูุณุฉ",
"ู
ุนุงู",
"ู",
"ูู",
"ุญุงุฌุฉ",
"!",
"!",
"ุ",
"ุนุงุฑููู
",
"ุ",
"ุทุจ",
"ู",
"ุงููุจู",
"ู
ุนูุฏูุด",
"ุงุชูููู",
"ุณูู",
"ุฃูู
ู",
"ู
ุนุงูู
",
"ุจููุฉ",
"ุนู
ุฑู",
"=)",
"EOS"
] | [
"ุนุงุฑู",
"ุงูุช",
"ุงู+ุตุญุงุจ",
"ุงู+ุฌุฏุน+ุฉ",
"ุฏู",
"ุงููู",
"ุจ+ุชุญุจ+ู+ู",
"ุงู+ุฎูุฑ",
"ู",
"ุฏุงูุณ+ุฉ",
"ู
ุนุง+ู",
"ู",
"ูู",
"ุญุงุฌ+ุฉ",
"!",
"!",
"ุ",
"ุนุงุฑู+ูู
",
"ุ",
"ุทุจ",
"ู",
"ุงู+ูุจู",
"ู
+ุนูุฏ+ู+ุด",
"ุงุชู+ููู",
"ุณูู",
"ุฃูู
ู",
"ู
ุนุง+ูู
",
"ุจูู+ุฉ",
"ุนู
ุฑ+ู",
"=)",
"EOS"
] | [
"ADJ",
"PRON",
"DET+NOUN",
"DET+ADJ+NSUFF",
"PRON",
"PART",
"PROG_PART+V+PREP+PRON",
"DET+NOUN",
"CONJ",
"ADJ+NSUFF",
"NOUN+PRON",
"PREP",
"NOUN",
"NOUN+NSUFF",
"PUNC",
"PUNC",
"PUNC",
"ADJ+PRON",
"PUNC",
"ADJ",
"CONJ",
"DET+NOUN",
"PART+NOUN+PRON+NEG_PART",
"NUM+NSUFF",
"NOUN",
"V",
"NOUN+PRON",
"NOUN+NSUFF",
"NOUN+PRON",
"EMOT",
"EOS"
] |
3 | "A" | [
"@MahaMaamoun",
"ูู",
"ูุงุณ",
"ุจุณูุทุฉ",
"ูุงููุง",
"ุจูุณุชูููุง",
"ุนูุดุงู",
"ูุฌูุจูุง",
"ุงูู",
"ูุนูุงููู
",
"ูุงูู",
"ู
ุญุจูุณูู",
"ู
ุนุงูู
",
"ู
ู",
"ุงูุดุจุงุจ",
"ุนูุดุงู",
"ูู",
"ูุงุณ",
"ู
ุจูุฌููุงุด",
"ุญุฏ",
"ุญุงุฌุฉ",
"ู
ุคูู
ุฉ",
"EOS"
] | [
"@MahaMaamoun",
"ูู",
"ูุงุณ",
"ุจุณูุท+ุฉ",
"ูุงู+ูุง",
"ุจ+ูุณุชูู+ูุง",
"ุนูุดุงู",
"ูุฌูุจ+ูุง",
"ุงูู",
"ู+ุนูุงู+ูู
",
"ู+ุงูู",
"ู
ุญุจูุณ+ูู",
"ู
ุนุง+ูู
",
"ู
ู",
"ุงู+ุดุจุงุจ",
"ุนูุดุงู",
"ูู",
"ูุงุณ",
"ู
+ุจ+ูุฌ+ู+ูุง+ุด",
"ุญุฏ",
"ุญุงุฌ+ุฉ",
"ู
ุคูู
+ุฉ",
"EOS"
] | [
"MENTION",
"PREP",
"NOUN",
"ADJ+NSUFF",
"V+PRON",
"PROG_PART+V+PRON",
"PART",
"V+PRON",
"NOUN",
"PREP+NOUN+PRON",
"CONJ+PART",
"ADJ+NSUFF",
"NOUN+PRON",
"PREP",
"DET+NOUN",
"PART",
"PREP",
"NOUN",
"PART+PROG_PART+V+PREP+PRON+NEG_PART",
"NOUN",
"NOUN+NSUFF",
"ADJ+NSUFF",
"EOS"
] |
4 | "A" | [
"ุจูููููุง",
"ุงููู",
"ุจูุญุจู",
"ููุจูู",
"ุนูู",
"ุทุจูุนุชู",
"ู
ุนุงู",
"!",
"ุจุณ",
"ุงููู",
"ุจูุนุดูู",
"ุจูุง",
"ููุนู
ู",
"ุญุงุฌุงุช",
"ู
ุด",
"ู
ู",
"ุทุจูุนุชู",
"ุงูู",
"ูุนู
ููุง",
"ุนุดุงู",
"ุจุณ",
"ูุฑุถูู",
"ู",
"ูุนุฌุจู",
"!",
"EOS"
] | [
"ุจ+ูููู+ูุง",
"ุงููู",
"ุจ+ูุญุจ+ู",
"ู+ูุจูู",
"ุนูู",
"ุทุจูุน+ุช+ู",
"ู
ุนุง+ู",
"!",
"ุจุณ",
"ุงููู",
"ุจ+ูุนุดู+ู",
"ุจูุง",
"ู+ูุนู
ู",
"ุญุงุฌ+ุงุช",
"ู
ุด",
"ู
ู",
"ุทุจูุน+ุช+ู",
"ุงู+ู",
"ูุนู
ู+ูุง",
"ุนุดุงู",
"ุจุณ",
"ูุฑุถู+ู",
"ู",
"ูุนุฌุจ+ู",
"!",
"EOS"
] | [
"PROG_PART+V+PRON",
"PART",
"PROG_PART+V+PRON",
"FUT_PART+V",
"PREP",
"NOUN+PRON+PRON",
"NOUN+PRON",
"PUNC",
"PART",
"PART",
"PROG_PART+V+PRON",
"ADV",
"FUT_PART+V",
"NOUN+NSUFF",
"PART",
"PREP",
"NOUN+NSUFF+PRON",
"PART+PRON",
"V+PRON",
"PART",
"ADV",
"V+PRON",
"CONJ",
"V+PRON",
"PUNC",
"EOS"
] |
5 | "A" | [
"ุจุชุญุจ",
"ุญุฏ",
"ุฑูุญ",
"ูููู",
"ุ",
"ู
ุด",
"ุชููู",
"ูุฃู
ู",
"ูุง",
"ุฅูู",
"ุฅูุง",
"ุงููู",
"ููู",
"ูุฃ",
".",
".",
".",
"ููู",
"ุจุชูุฑู",
"ุญุฏ",
"ุงุจุนุฏ",
"ุนูู",
"ููุด",
"ู
ุถุทุฑ",
"ุชุนูุด",
"ุญูุงุชู",
"ูู",
"ุชู
ุซูู",
".",
".",
".",
"ุฒุนูุงู",
"ู
ู",
"ุญุฏ",
"ุฑูุญ",
"ุตูู",
"ุฃู
ูุฑู",
"ู
ุนุงู",
"EOS"
] | [
"ุจ+ุชุญุจ",
"ุญุฏ",
"ุฑูุญ",
"ูู+ู+ู",
"ุ",
"ู
ุด",
"ุชููู",
"ู+ุฃู
+ู",
"ูุง",
"ุฅูู",
"ุฅูุง",
"ุงููู",
"ู+ูู",
"ูุฃ",
".",
".",
".",
"ู+ูู",
"ุจ+ุชูุฑู",
"ุญุฏ",
"ุงุจุนุฏ",
"ุนู+ู",
"ู+ูุด",
"ู
ุถุทุฑ",
"ุชุนูุด",
"ุญูุง+ุช+ู",
"ูู",
"ุชู
ุซูู",
".",
".",
".",
"ุฒุนูุงู",
"ู
ู",
"ุญุฏ",
"ุฑูุญ",
"ุตู+ู",
"ุฃู
ูุฑ+ู",
"ู
ุนุง+ู",
"EOS"
] | [
"PROG_PART+V",
"NOUN",
"V",
"V+PREP+PRON",
"PUNC",
"PART",
"V",
"PREP+NOUN+NSUFF",
"PART",
"NOUN",
"PART",
"NOUN",
"CONJ+PRON",
"PART",
"PUNC",
"PUNC",
"PUNC",
"CONJ+PART",
"PROG_PART+V",
"NOUN",
"V",
"PREP+PRON",
"CONJ+PART",
"ADJ",
"V",
"NOUN+NSUFF+PRON",
"PREP",
"NOUN",
"PUNC",
"PUNC",
"PUNC",
"ADJ",
"PREP",
"NOUN",
"V",
"V+PRON",
"NOUN+PRON",
"NOUN+PRON",
"EOS"
] |
5 | "A" | [
"ุนุงูุฒุฉ",
"ุฃูุถูุถ",
"ู
ู",
"ุบูุฑ",
"ู
ุงุญุฏ",
"ูููู",
"ูู",
"ู
ุนูุด",
"ุฃู",
"ูููู",
"ุฃู",
"ููุถู",
".",
".",
"ูุฏู",
"ู
ูุณุชุญูู",
".",
".",
"ูุจู
ุง",
"ุฅูู",
"ุณุจุจ",
"ูุฑูู",
"ูุชุนุงูู",
"ุฃูุถูุถูู",
"ุฅูุชู",
"ูุญููู",
"ู
ุดุงูููุง",
"!",
"EOS"
] | [
"ุนุงูุฒ+ุฉ",
"ุฃูุถูุถ",
"ู
ู",
"ุบูุฑ",
"ู
ุง+ุญุฏ",
"ูููู",
"ู+ู",
"ู
ุนูุด",
"ุฃู",
"ูู+ู",
"ุฃู",
"ููุถ+ู",
".",
".",
"ู+ุฏู",
"ู
ุณุชุญูู",
".",
".",
"ู+ุจ+ู
ุง",
"ุฅู+ู",
"ุณุจุจ",
"ูุฑู+ู",
"ู+ุชุนุงู+ู",
"ุฃูุถูุถ+ู+ู",
"ุฅูุช",
"ู+ุญู+ู+ู",
"ู
ุดุงูู+ูุง",
"!",
"EOS"
] | [
"ADJ+NSUFF",
"V",
"PREP",
"NOUN",
"PART+NOUN",
"V",
"PREP+PRON",
"NOUN",
"CONJ",
"V+PRON",
"CONJ",
"V+PRON",
"PUNC",
"PUNC",
"CONJ+PRON",
"ADJ",
"PUNC",
"PUNC",
"CONJ+PREP+PART",
"PART+PRON",
"NOUN",
"NOUN+PRON",
"CONJ+V+PRON",
"V+PREP+PRON",
"PRON",
"CONJ+V+PREP+PRON",
"NOUN+PRON",
"PUNC",
"EOS"
] |
1 | "A" | [
"ุงููุงุญุฏ",
"ูู
ุง",
"ุจููุงู
",
"ูุชูุฑ",
"ุ",
"ุจูุญูู
",
"ุจุฃุญูุงู
",
"-",
"ููุง",
"ูู",
"ุงูุฃุบูุจ",
"ููุงูุณ",
"ุงู",
"ุญุงุฌุงุช",
"ุชุงููุฉ",
"ุ",
"ุจุณ",
"ุงูู
ูู
",
"ู
ุด",
"ุฃุญูุงู
",
"ูุนูู",
"-",
"ู
ุงููู
ุด",
"ุงู",
"ุนูุงูุฉ",
"ุจุจุนุถ",
"ุ",
"ู
ุชุชุงููุฉ",
"ุ",
"ูุบูุฑ",
"ู
ูุทููุฉ",
".",
"EOS"
] | [
"ุงู+ูุงุญุฏ",
"ูู
ุง",
"ุจ+ููุงู
",
"ูุชูุฑ",
"ุ",
"ุจ+ูุญูู
",
"ุจ+ุฃุญูุงู
",
"-",
"ููุง",
"ูู",
"ุงู+ุฃุบูุจ",
"ููุงูุณ",
"ุงู",
"ุญุงุฌ+ุงุช",
"ุชุงูู+ุฉ",
"ุ",
"ุจุณ",
"ุงู+ู
ูู
",
"ู
ุด",
"ุฃุญูุงู
",
"ูุนูู",
"-",
"ู
ุง+ู+ูู
+ุด",
"ุงู",
"ุนูุงู+ุฉ",
"ุจ+ุจุนุถ",
"ุ",
"ู
ุชุชุงูู+ุฉ",
"ุ",
"ู+ุบูุฑ",
"ู
ูุทูู+ุฉ",
".",
"EOS"
] | [
"DET+NOUN",
"PART",
"PROG_PART+V",
"ADJ",
"PUNC",
"PROG_PART+V",
"PREP+NOUN",
"PUNC",
"PRON",
"PREP",
"DET+ADJ",
"NOUN",
"CONJ",
"NOUN+NSUFF",
"ADJ+NSUFF",
"PUNC",
"PART",
"DET+ADJ",
"PART",
"NOUN",
"ADV",
"PUNC",
"PART+PREP+PRON+NEG_PART",
"NOUN",
"NOUN+NSUFF",
"PREP+NOUN",
"PUNC",
"NOUN+NSUFF",
"PUNC",
"CONJ+PART",
"ADJ+NSUFF",
"PUNC",
"EOS"
] |
3 | "A" | [
"ู",
"ุญุงุฌู",
"ุธุฑููู",
"ุงูุง",
"ุดูุฑุช",
"ุงุบููู",
"ุฑููุด",
"ุน",
"ุตูุญุงุช",
"ุงูู
ูุถู",
"ูุงูุงูู",
"ูุฌุงุจุช",
"ุฑูุฏู",
"ูุนู",
"ุญููุฉ",
"ุฎุตูุตุง",
"ุจุชุงุนุช",
"ุงูุงูู",
"ุงููู",
"ุนูุฏู",
"ุจูู",
"ุจูุฌ",
"ุชุงูู",
"ููููู",
"#RanaSamahaTeam",
"EOS"
] | [
"ู",
"ุญุงุฌ+ู",
"ุธุฑูู+ู",
"ุงูุง",
"ุดูุฑ+ุช",
"ุงุบูู+ู",
"ุฑููุด",
"ุน",
"ุตูุญ+ุงุช",
"ุงู+ู
ูุถ+ู",
"ู+ุงู+ุงูู",
"ู+ุฌุงุจ+ุช",
"ุฑูุฏู",
"ูุนู",
"ุญูู+ุฉ",
"ุฎุตูุต+ุง",
"ุจุชุงุน+ุช",
"ุงู+ุงูู",
"ุงููู",
"ุนูุฏ+ู",
"ุจูู",
"ุจูุฌ",
"ุชุงูู",
"ููู+ู+ู",
"#RanaSamahaTeam",
"EOS"
] | [
"PREP",
"NOUN+NSUFF",
"ADJ+NSUFF",
"PRON",
"V+PRON",
"NOUN+NSUFF",
"NOUN",
"PREP",
"NOUN+NSUFF",
"DET+NOUN+NSUFF",
"CONJ+DET+NOUN",
"CONJ+V+PRON",
"NOUN",
"NOUN",
"ADJ+NSUFF",
"NOUN+CASE",
"NOUN+NSUFF",
"DET+NOUN",
"PART",
"NOUN+PRON",
"ADV",
"NOUN",
"ADJ",
"V+PREP+PRON",
"HASH",
"EOS"
] |
2 | "A" | [
"ุงูุฏูููููุง",
"ุฏู",
"ุนุจุงุฑุฉ",
"ุนู",
"ุงู
ุชุญุงู",
"ู",
"ุงุญูุง",
"ููู",
"ููู
",
"ู
ุง",
"ุงูุงู
ุชุญุงู",
"ุฏุฉ",
"ุจูุฎูุต",
"ุญูุงู",
"ุงูุงูุณุงู",
"ูู
ุงู",
"ุจุชุฎูุต",
"ุณุงุนุชูุง",
"ุจูู",
"ุจูุฑูุญ",
"ูุฌูุจ",
"ูุชูุฌุชุฉ",
".",
".",
"EOS"
] | [
"ุงู+ุฏููุง",
"ุฏู",
"ุนุจุงุฑ+ุฉ",
"ุนู",
"ุงู
ุชุญุงู",
"ู",
"ุงุญูุง",
"ูู+ู",
"ููู
",
"ู
ุง",
"ุงู+ุงู
ุชุญุงู",
"ุฏุฉ",
"ุจ+ูุฎูุต",
"ุญูุง+ู",
"ุงู+ุงูุณุงู",
"ูู
ุงู",
"ุจ+ุชุฎูุต",
"ุณุงุน+ุช+ูุง",
"ุจูู",
"ุจ+ูุฑูุญ",
"ูุฌูุจ",
"ูุชูุฌ+ุช+ุฉ",
".",
".",
"EOS"
] | [
"DET+NOUN",
"PRON",
"NOUN+NSUFF",
"PREP",
"NOUN",
"CONJ",
"PRON",
"PREP+PRON",
"NOUN",
"PART",
"DET+NOUN",
"PRON",
"PROG_PART+V",
"NOUN+NSUFF",
"DET+NOUN",
"ADV",
"PROG_PART+V",
"NOUN+NSUFF+PRON",
"ADV",
"PROG_PART+V",
"V",
"NOUN+NSUFF+PRON",
"PUNC",
"PUNC",
"EOS"
] |
4 | "A" | [
"ูู
ูุข",
"ุชูุฌู",
"ุนูู",
"ููุณู",
"ูุชูุฑ",
"ุขุนุฑู",
"ุฃูู",
"ู
ูุขุดู",
"ุบูุท",
":)",
"EOS"
] | [
"ูู
ุข",
"ุชูุฌ+ู",
"ุนูู",
"ููุณ+ู",
"ูุชูุฑ",
"ุขุนุฑู",
"ุฃู+ู",
"ู
ุขุดู",
"ุบูุท",
":)",
"EOS"
] | [
"PART",
"V+PRON",
"PREP",
"NOUN+PRON",
"ADJ",
"V",
"PART+PRON",
"ADJ",
"NOUN",
"EMOT",
"EOS"
] |
4 | "A" | [
"@HanyAEllatif",
"ูู",
"ู
ุง",
"ููุด",
"ุงฺคูุฑุฉ",
"ู
ุง",
"ููุด",
"ู
ุตุฑููู",
".",
".",
"ุฑุจูุง",
"ูุฎูููุง",
"ููุฃฺคูุฑ",
"ูู
ุงู",
"ููู
ุงู",
".",
".",
"p:",
"EOS"
] | [
"@HanyAEllatif",
"ูู",
"ู
ุง",
"ูู+ุด",
"ุงููุฑ+ุฉ",
"ู
ุง",
"ูู+ุด",
"ู
ุตุฑู+ูู",
".",
".",
"ุฑุจ+ูุง",
"ูุฎู+ู+ูุง",
"ู+ูุฃููุฑ",
"ูู
ุงู",
"ู+ูู
ุงู",
".",
".",
"p:",
"EOS"
] | [
"MENTION",
"PART",
"PART",
"PREP+NEG_PART",
"NOUN+NSUFF",
"PART",
"PREP+NEG_PART",
"NOUN+NSUFF",
"PUNC",
"PUNC",
"NOUN+PRON",
"V+PRON+PRON",
"CONJ+V",
"ADV",
"CONJ+ADV",
"PUNC",
"PUNC",
"EMOT",
"EOS"
] |
4 | "A" | [
"ูุจุนุฏูู",
"ุงูุชูุง",
"ุงุฒุงู",
"ุชุจุฏุฃูุง",
"ุฏุฑูุณ",
"ู
ู",
"ูุจู",
"ุงูุฏุฑุงุณุฉ",
"ุ",
"ูุง",
"ุ",
"ูุนูู",
"ุงุฒุงู",
"ูููู",
"ุนูุฏู",
"ุฏุฑุณ",
"ุงูููุงุฑุฏุฉ",
"._.",
"EOS"
] | [
"ู+ุจุนุฏูู",
"ุงูุชูุง",
"ุงุฒุงู",
"ุชุจุฏุฃ+ูุง",
"ุฏุฑูุณ",
"ู
ู",
"ูุจู",
"ุงู+ุฏุฑุงุณ+ุฉ",
"ุ",
"ูุง",
"ุ",
"ูุนูู",
"ุงุฒุงู",
"ูููู",
"ุนูุฏ+ู",
"ุฏุฑุณ",
"ุงู+ููุงุฑุฏ+ุฉ",
"._.",
"EOS"
] | [
"CONJ+NOUN",
"PRON",
"PART",
"V+PRON",
"NOUN",
"PREP",
"NOUN",
"DET+NOUN+NSUFF",
"PUNC",
"PART",
"PUNC",
"ADV",
"PART",
"V",
"NOUN+PRON",
"NOUN",
"DET+NOUN+NSUFF",
"EMOT",
"EOS"
] |
1 | "A" | [
"ููุช",
"ุฎุงูู",
"ุงูุณูุณู",
"ูุทูุน",
"ุฐูู",
"ูู
ูุชุฑุดุญุด",
",",
",",
"ุงูุญู
ุฏ",
"ููู",
"ุงูุญู
ุงุฑ",
"ูููุจุณ",
":D",
"EOS"
] | [
"ูู+ุช",
"ุฎุงูู",
"ุงู+ุณูุณู",
"ูุทูุน",
"ุฐูู",
"ู+ู
+ูุชุฑุดุญ+ุด",
",",
",",
"ุงู+ุญู
ุฏ",
"ู+ุงููู",
"ุงู+ุญู
ุงุฑ",
"ู+ููุจุณ",
":D",
"EOS"
] | [
"V+PRON",
"ADJ",
"DET+NOUN",
"V",
"ADJ",
"CONJ+PART+V+NEG_PART",
"PUNC",
"PUNC",
"DET+NOUN",
"PREP+NOUN",
"DET+NOUN",
"FUT_PART+V",
"EMOT",
"EOS"
] |
3 | "A" | [
"@hananalyaly@ahmedadel755",
"ูู",
"ูุฒูุฑ",
"ุฏูุงุน",
"ูุงูู
",
"ูููุณ",
"ุญุฏูุฏ",
"ู
ูุตุจู",
"ูุงุญุชุฑุงู
ู",
"ู
ูุตุญุด",
"ูุชููู
",
"ูู",
"ุญุงุฌุฉ",
"ูุณุฉ",
"ู
ุด",
"ู
ูุฌูุฏุฉ",
"EOS"
] | [
"@hananalyaly@ahmedadel755",
"ูู",
"ูุฒูุฑ",
"ุฏูุงุน",
"ูุงูู
",
"ูููุณ",
"ุญุฏูุฏ",
"ู
ูุตุจ+ู",
"ู+ุงุญุชุฑุงู
+ู",
"ู
+ูุตุญ+ุด",
"ูุชููู
",
"ูู",
"ุญุงุฌ+ุฉ",
"ูุณ+ุฉ",
"ู
ุด",
"ู
ูุฌูุฏ+ุฉ",
"EOS"
] | [
"MENTION",
"PRON",
"NOUN",
"NOUN",
"ADJ",
"ADJ",
"NOUN",
"NOUN+PRON",
"CONJ+NOUN+PRON",
"PART+V+NEG_PART",
"V",
"PREP",
"NOUN+NSUFF",
"ADV+NSUFF",
"PART",
"ADJ+NSUFF",
"EOS"
] |
3 | "A" | [
"ุดูููุง",
"ุจูุจุณ",
"ุงูู
ุฏุฑุณุฉ",
"ุฏู",
"ูููุถู",
"ููุทุฉ",
"ุณูุฏุฉ",
"ูู",
"ุญูุงุชูุง",
"ุทูู",
"ู
ุงุญูุง",
"ุนุงูุดูู",
"ุ",
"ู
ุฃุณุงู",
".",
"EOS"
] | [
"ุดูู+ูุง",
"ุจ+ูุจุณ",
"ุงู+ู
ุฏุฑุณ+ุฉ",
"ุฏู",
"ู+ููุถู",
"ููุท+ุฉ",
"ุณูุฏ+ุฉ",
"ูู",
"ุญูุง+ุช+ูุง",
"ุทูู",
"ู
ุง+ุญูุง",
"ุนุงูุด+ูู",
"ุ",
"ู
ุฃุณุง+ู",
".",
"EOS"
] | [
"NOUN+PRON",
"PREP+NOUN",
"DET+NOUN+NSUFF",
"PRON",
"FUT_PART+V",
"NOUN+NSUFF",
"ADJ+NSUFF",
"PREP",
"NOUN+NSUFF+PRON",
"NOUN",
"PART+PRON",
"ADJ+NSUFF",
"PUNC",
"NOUN+NSUFF",
"PUNC",
"EOS"
] |
5 | "A" | [
"ู
ู",
"ุงูููุงุฑุฏู",
"ููุจุฏุฃ",
"ุงูุฅุนูุงู
",
"ูุชููู
",
"ุนูู",
"ุงู",
"ุงุฏ",
"ุงูู",
"ู
ุดุงูู",
"ู
ุตุฑ",
"ูุชูุฑู",
"ูุชุญููููุง",
"ุตุนุจ",
"ูู",
"ุณูู",
"ุงู",
"ุงุชููู",
",",
"ูู
ุญุชุงุฌู",
"ุณููู",
"ุทูููู",
"ุนูุดุงู",
"ู
ุตุฑ",
"ุชุชูุฏู
",
",",
"ูู
ุญุฏุด",
"ูุณุชุนุฌู",
"EOS"
] | [
"ู
ู",
"ุงู+ููุงุฑุฏ+ู",
"ู+ูุจุฏุฃ",
"ุงู+ุฅุนูุงู
",
"ูุชููู
",
"ุนูู",
"ุงู",
"ุงุฏ",
"ุงูู",
"ู
ุดุงูู",
"ู
ุตุฑ",
"ูุชูุฑ+ู",
"ู+ุชุญููู+ูุง",
"ุตุนุจ",
"ูู",
"ุณู+ู",
"ุงู",
"ุงุชู+ูู",
",",
"ู+ู
ุญุชุงุฌ+ู",
"ุณู+ูู",
"ุทููู+ู",
"ุนูุดุงู",
"ู
ุตุฑ",
"ุชุชูุฏู
",
",",
"ู+ู
+ุญุฏ+ุด",
"ูุณุชุนุฌู",
"EOS"
] | [
"PREP",
"DET+NOUN+NSUFF",
"FUT_PART+V",
"DET+NOUN",
"V",
"PREP",
"PART",
"NOUN",
"PART",
"NOUN",
"NOUN",
"ADJ+NSUFF",
"CONJ+NOUN+PRON",
"ADJ",
"PREP",
"NOUN+NSUFF",
"CONJ",
"NUM+NSUFF",
"PUNC",
"CONJ+ADJ+NSUFF",
"NOUN+NSUFF",
"ADJ+NSUFF",
"PART",
"NOUN",
"V",
"PUNC",
"CONJ+PART+NOUN+NEG_PART",
"V",
"EOS"
] |
2 | "A" | [
"ูุนู
ุงููู",
"ูููู",
"ูู",
"ูุตุงูุญ",
"ูุงุญูุง",
"ุนุงูุฒูู",
"ุงููู",
"ููุตุญูุง",
".",
"EOS"
] | [
"ู+ุนู
ุงู+ูู",
"ูููู",
"ูู",
"ูุตุงูุญ",
"ู+ุงุญูุง",
"ุนุงูุฒ+ูู",
"ุงููู",
"ููุตุญ+ูุง",
".",
"EOS"
] | [
"CONJ+ADJ+PRON",
"V",
"PREP",
"NOUN",
"CONJ+PRON",
"ADJ+NSUFF",
"PART",
"V+PRON",
"PUNC",
"EOS"
] |
3 | "A" | [
"ูุงุนู
",
"ุงุถุญู",
"ููุจู",
"ูููู",
"ุฃุฎุฏุช",
"ุฅูู",
"ู
ู",
"ุงูุฒุนู",
"ุ",
"ุถุญูู",
"ุจุณูุทู",
"ูู",
"ุฃู",
"ููุช",
"ู
ู
ูู",
"ุชุฏูู",
"ุฃู
ู",
":)",
"EOS"
] | [
"ูุง+ุนู
",
"ุงุถุญู",
"ู+ูุจู",
"ูู+ู+ู",
"ุฃุฎุฏ+ุช",
"ุฅูู",
"ู
ู",
"ุงู+ุฒุนู",
"ุ",
"ุถุญู+ู",
"ุจุณูุท+ู",
"ูู",
"ุฃู",
"ููุช",
"ู
ู
ูู",
"ุชุฏ+ู+ู",
"ุฃู
ู",
":)",
"EOS"
] | [
"PART+NOUN",
"V",
"CONJ+NOUN",
"V+PREP+PRON",
"V+PRON",
"PART",
"PREP",
"DET+NOUN",
"PUNC",
"NOUN+NSUFF",
"ADJ+NSUFF",
"PREP",
"NOUN",
"NOUN",
"ADJ",
"V+PRON+PRON",
"NOUN",
"EMOT",
"EOS"
] |
1 | "A" | [
"ู
ุจูุชุด",
"ู
ุดููู",
"ุงููู
",
"ูุฏุงูููู",
"ููุง",
"ุญุชู",
"ูุฒุนููู",
"ุนุงุฏู",
"ุงุตูุง",
"ุ",
"ุงูู
ุดููู",
"ุงูู",
"ููุช",
"ูุงูุฑูู
",
"ุญุงุฌู",
"ุชุงููู",
"ุบูุฑ",
"ูุฏู",
"#ุฏููุง",
"#ุงู_ูุงููู",
"EOS"
] | [
"ู
+ุจู+ุช+ุด",
"ู
ุดูู+ู",
"ุงู+ูู
",
"ูุฏุงูู+ู+ู",
"ู+ูุง",
"ุญุชู",
"ูุฒุนู+ู+ู",
"ุนุงุฏู",
"ุงุตู+ุง",
"ุ",
"ุงู+ู
ุดูู+ู",
"ุงู+ู",
"ูู+ุช",
"ูุงูุฑ+ูู
",
"ุญุงุฌ+ู",
"ุชุงูู+ู",
"ุบูุฑ",
"ูุฏู",
"#ุฏููุง",
"#ุงู_ูุงููู",
"EOS"
] | [
"PART+V+PRON+NEG_PART",
"NOUN+NSUFF",
"PART+PRON",
"V+PRON+PRON",
"CONJ+PART",
"PART",
"V+PRON+PRON",
"ADJ",
"NOUN+CASE",
"PUNC",
"DET+NOUN+NSUFF",
"PART+PRON",
"V+PRON",
"ADJ+PRON",
"NOUN+NSUFF",
"ADJ+NSUFF",
"NOUN",
"ADV",
"HASH",
"HASH",
"EOS"
] |
2 | "A" | [
"ุนุงุฑู",
"ุงููู",
"ุจุชุตุญู",
"ุชููู
ู",
"ุงูู",
"ูุงุญุฏ",
"ู",
"ูุจู",
"ู
ุง",
"ุชูุงู
",
"ูููู",
"ูู",
"ุงุฎุฑ",
"ูุงุญุฏ",
"ู
ููู
ู",
"ุ",
"ู
ููุด",
"ุงูู
",
"ู
ูู",
"ูู",
"ุญูุงุชู",
"EOS"
] | [
"ุนุงุฑู",
"ุงููู",
"ุจ+ุชุตุญู",
"ุชููู
+ู",
"ุงูู",
"ูุงุญุฏ",
"ู",
"ูุจู",
"ู
ุง",
"ุชูุงู
",
"ูููู",
"ูู",
"ุงุฎุฑ",
"ูุงุญุฏ",
"ู
ููู
+ู",
"ุ",
"ู
+ูู+ุด",
"ุงูู
",
"ู
ู+ู",
"ูู",
"ุญูุง+ุช+ู",
"EOS"
] | [
"ADJ",
"PART",
"PROG_PART+V",
"V+PRON",
"NUM",
"NOUN",
"CONJ",
"NOUN",
"PART",
"V",
"V",
"PRON",
"ADJ",
"NOUN",
"ADJ+PRON",
"PUNC",
"PART+PREP+NEG_PART",
"ADJ",
"PREP+PRON",
"PREP",
"NOUN+NSUFF+PRON",
"EOS"
] |
1 | "A" | [
"ูุจู
ุง",
"ุงู",
"ุณูุงู",
"ุงูู
ููุฑูุจุงุต",
"ูู",
"ุงูุจูุฏ",
"ุฏู",
"ุจูุชูุงูู",
"ูุง",
"ูุงู
ุดู
ููุฏุณ",
"ููู",
"ุทุจูุนู",
"ุฌุฏุง",
"ุงู",
"ุงูู
ููุฏุณ",
"ูุชูุงูู",
"ูุง",
"ุงุณุทู",
"#ู
ุตุฑ",
"EOS"
] | [
"ู+ุจ+ู
ุง",
"ุงู",
"ุณูุงู",
"ุงู+ู
ููุฑูุจุงุต",
"ูู",
"ุงู+ุจูุฏ",
"ุฏู",
"ุจ+ูุชูุง+ู+ู",
"ูุง",
"ูุง+ู
ุดู
ููุฏุณ",
"ู",
"ุทุจูุนู",
"ุฌุฏ+ุง",
"ุงู",
"ุงู+ู
ููุฏุณ",
"ูุชูุง+ู+ู",
"ูุง",
"ุงุณุทู",
"#ู
ุตุฑ",
"EOS"
] | [
"CONJ+PREP+PART",
"PART",
"NOUN",
"DET+NOUN",
"PREP",
"DET+NOUN",
"PRON",
"PROG_PART+V+PREP+PRON",
"PART",
"PART+NOUN",
"CONJ",
"ADJ",
"NOUN+CASE",
"PART",
"DET+NOUN",
"V+PREP+PRON",
"PART",
"NOUN",
"HASH",
"EOS"
] |
4 | "A" | [
"ู
ุด",
"ูุนุฑู",
"ุงูุตู",
"ููุงูู",
"ููุง",
"ุงูุฉ",
".",
"ูู",
"ู
ุง",
"ุงููู",
"ูุงูุช",
".",
"ุงูุงูู",
"ูู
",
"ุญุฏ",
"ุนู
ูู",
"ุงููููู",
".",
"ุญุฑุงู
",
"ุนูููู
",
"ู
ุด",
"ูุฏุฉ",
".",
"ูุชุนูุฏููุง",
"ูู",
"ููุณูุง",
"ูุง",
"ุฌุฏุนุงู",
".",
"EOS"
] | [
"ู
ุด",
"ู+ุนุฑู",
"ุงูุตู",
"ู+ุงู+ุงูู",
"ู+ูุง",
"ุงูุฉ",
".",
"ูู",
"ู
ุง",
"ุงููู",
"ูุงู+ุช",
".",
"ุงูุงูู",
"ูู
",
"ุญุฏ",
"ุนู
+ู+ู",
"ุงููููู",
".",
"ุญุฑุงู
",
"ุนูู+ูู
",
"ู
ุด",
"ูุฏุฉ",
".",
"ู+ุชุนูุฏ+ู+ูุง",
"ูู",
"ููุณ+ูุง",
"ูุง",
"ุฌุฏุนุงู",
".",
"EOS"
] | [
"PART",
"FUT_PART+V",
"V",
"PREP+DET+NUM",
"CONJ+PART",
"PART",
"PUNC",
"NOUN",
"PART",
"V",
"V+PRON",
"PUNC",
"V",
"NOUN",
"NOUN",
"V+PREP+PRON",
"NOUN",
"PUNC",
"NOUN",
"PREP+PRON",
"PART",
"ADV",
"PUNC",
"FUT_PART+V+PRON+PRON",
"PREP",
"NOUN+PRON",
"PART",
"NOUN",
"PUNC",
"EOS"
] |
4 | "A" | [
"ุฅุญุณุงุณ",
"ูุง",
"ููุตู",
"ุฅูู",
"ุชูุฒู",
"ุชุนู
ู",
"ุดูุจููุฌ",
"ู",
"ุชุดุชุฑู",
"ูู",
"ุฅููู",
"ุนุงูุฒู",
"ู
ู",
"ุบูุฑ",
"ู
ุง",
"ุชุฏูู",
"ุฏู",
"ุจูุงู
",
"ู",
"ุฏู",
"ุจูุงู
",
".",
".",
"EOS"
] | [
"ุฅุญุณุงุณ",
"ูุง",
"ููุตู",
"ุฅู+ู",
"ุชูุฒู",
"ุชุนู
ู",
"ุดูุจููุฌ",
"ู",
"ุชุดุชุฑู",
"ูู",
"ุฅููู",
"ุนุงูุฒ+ู",
"ู
ู",
"ุบูุฑ",
"ู
ุง",
"ุชุฏูู",
"ุฏู",
"ุจ+ูุงู
",
"ู",
"ุฏู",
"ุจ+ูุงู
",
".",
".",
"EOS"
] | [
"NOUN",
"PART",
"V",
"PART+PRON",
"V",
"V",
"NOUN",
"CONJ",
"V",
"NOUN",
"PART",
"ADJ+PRON",
"PREP",
"NOUN",
"PART",
"V",
"PRON",
"PREP+PART",
"CONJ",
"PRON",
"PREP+PART",
"PUNC",
"PUNC",
"EOS"
] |
3 | "A" | [
"@Nodygamal93",
"ุงุญุณุงุณ",
"ุญูู",
"ูู
ุง",
"ุชูุงูู",
"ุญุฏ",
"ุดุจูู",
"ูู",
"ุญุงุฌุงุช",
"ูุชูุฑุฉ",
",",
"ูููุชู
",
"ุจููุณ",
"ุงูุญุงุฌุงุช",
"ุงููู",
"ุจุชุญุจูุง",
".",
"ูุงูุฑู",
"ุชุคุงู
",
"ุชุคุงู
",
":-D",
"EOS"
] | [
"@Nodygamal93",
"ุงุญุณุงุณ",
"ุญูู",
"ูู
ุง",
"ุชูุงูู",
"ุญุฏ",
"ุดุจู+ู",
"ูู",
"ุญุงุฌ+ุงุช",
"ูุชูุฑ+ุฉ",
",",
"ู+ููุชู
",
"ุจ+ููุณ",
"ุงู+ุญุงุฌ+ุงุช",
"ุงููู",
"ุจ+ุชุญุจ+ูุง",
".",
"ูุงูุฑ+ู",
"ุชุคุงู
",
"ุชุคุงู
",
":-D",
"EOS"
] | [
"MENTION",
"NOUN",
"ADJ",
"PART",
"V",
"NOUN",
"NOUN+PRON",
"PREP",
"NOUN+NSUFF",
"ADJ+NSUFF",
"PUNC",
"CONJ+V",
"PREP+NOUN",
"DET+NOUN+NSUFF",
"PART",
"PROG_PART+V+PRON",
"PUNC",
"ADJ+PRON",
"NOUN",
"NOUN",
"EMOT",
"EOS"
] |
2 | "A" | [
"ุงูุง",
"ุนุงูุฒ",
"ูุจูู",
"ุนูุฏู",
"ุงุจู",
"ุนุดุงู",
"ุงุนูู
ู",
"ุงูุณุจุงุญุฉ",
"ุจุณ",
",",
",",
",",
"ุฏู",
"ุฃู
ุชุน",
"ุญุงุฌุฉ",
"ู
ู
ูู",
"ุงูุฃุจ",
"ูุนู
ููุง",
"ุงูุญูููุฉ",
",",
",",
",",
"ุบูุฑ",
"ูุฏู",
"ุงูู
ูุถูุน",
"ู
ุด",
"ุฌุงูุจ",
"ูู
ู",
"EOS"
] | [
"ุงูุง",
"ุนุงูุฒ",
"ูุจูู",
"ุนูุฏ+ู",
"ุงุจู",
"ุนุดุงู",
"ุงุนูู
+ู",
"ุงู+ุณุจุงุญ+ุฉ",
"ุจุณ",
",",
",",
",",
"ุฏู",
"ุฃู
ุชุน",
"ุญุงุฌ+ุฉ",
"ู
ู
ูู",
"ุงู+ุฃุจ",
"ูุนู
ู+ูุง",
"ุงู+ุญููู+ุฉ",
",",
",",
",",
"ุบูุฑ",
"ูุฏู",
"ุงู+ู
ูุถูุน",
"ู
ุด",
"ุฌุงูุจ",
"ูู
+ู",
"EOS"
] | [
"PRON",
"ADJ",
"V",
"NOUN+PRON",
"NOUN",
"PART",
"V+PRON",
"DET+NOUN+NSUFF",
"ADV",
"PUNC",
"PUNC",
"PUNC",
"PRON",
"ADJ",
"NOUN+NSUFF",
"ADJ",
"DET+NOUN",
"V+PRON",
"DET+NOUN+NSUFF",
"PUNC",
"PUNC",
"PUNC",
"NOUN",
"ADV",
"DET+NOUN",
"PART",
"ADJ",
"NOUN+PRON",
"EOS"
] |
4 | "A" | [
"ุฎุณุงุฑุฉ",
"ููู",
"ููู
ุฉ",
"ุฑุงุฌู",
"ูู",
"ุจุชุณูุจ",
"ุตุญุงุจู",
"ูุชููู
ูุง",
"ุนูู",
"ุจูุช",
"ุฃูุช",
"ุชุนุฑููุง",
"ู
ู",
"ุบูุฑ",
"ู
ุงุชุฑุฏ",
"ุนูููู
",
".",
"EOS"
] | [
"ุฎุณุงุฑ+ุฉ",
"ูู+ู",
"ููู
+ุฉ",
"ุฑุงุฌู",
"ูู",
"ุจ+ุชุณูุจ",
"ุตุญุงุจ+ู",
"ูุชููู
+ูุง",
"ุนูู",
"ุจูุช",
"ุฃูุช",
"ุชุนุฑู+ูุง",
"ู
ู",
"ุบูุฑ",
"ู
ุง+ุชุฑุฏ",
"ุนูู+ูู
",
".",
"EOS"
] | [
"NOUN+NSUFF",
"PREP+PRON",
"NOUN+NSUFF",
"NOUN",
"PART",
"PROG_PART+V",
"NOUN+PRON",
"V+PRON",
"PREP",
"NOUN",
"PRON",
"V+PRON",
"PREP",
"NOUN",
"PART+V",
"PREP+PRON",
"PUNC",
"EOS"
] |
4 | "A" | [
"Serious",
"Question",
":",
"ููู",
"ุงููุงุญุฏ",
"ูู
ุง",
"ูุจูู",
"ู
ุจุณูุท",
"ุทูู",
"ุงูููุงุฑ",
"ูุงุฒู
",
"ุชุญุตู",
"ูู",
"ุงูุฃุฎุฑ",
"ุญุงุฌุฉ",
"ุชููุฏ",
"ุนููู",
"ุ",
"!",
"EOS"
] | [
"Serious",
"Question",
":",
"ููู",
"ุงู+ูุงุญุฏ",
"ูู
ุง",
"ูุจูู",
"ู
ุจุณูุท",
"ุทูู",
"ุงู+ููุงุฑ",
"ูุงุฒู
",
"ุชุญุตู",
"ูู",
"ุงู+ุฃุฎุฑ",
"ุญุงุฌ+ุฉ",
"ุชููุฏ",
"ุนูู+ู",
"ุ",
"!",
"EOS"
] | [
"FOREIGN",
"FOREIGN",
"PUNC",
"PART",
"DET+NOUN",
"PART",
"V",
"ADJ",
"NOUN",
"DET+NOUN",
"ADJ",
"V",
"PREP",
"DET+ADJ",
"NOUN+NSUFF",
"V",
"PREP+PRON",
"PUNC",
"PUNC",
"EOS"
] |
5 | "A" | [
"ูู",
"ูุงุญุฏ",
"ููุฌู",
"ููููู",
"ู
ุด",
"ููุฏุฑ",
"ุฃุบูุฑ",
"ุฅุฑุซ",
"ุณููู",
"ู
ู",
"ุงููุณุงุฏ",
".",
"ุทูุจ",
"ุญุถุฑุชู",
"ุจุชุชุนุจ",
"ููุณู",
"ูุฌุงู",
"ุชุญูู
",
"ููู",
"ุ",
"EOS"
] | [
"ูู",
"ูุงุญุฏ",
"ููุฌู",
"ููู+ู+ู",
"ู
ุด",
"ู+ูุฏุฑ",
"ุฃุบูุฑ",
"ุฅุฑุซ",
"ุณู+ูู",
"ู
ู",
"ุงู+ูุณุงุฏ",
".",
"ุทูุจ",
"ุญุถุฑ+ุช+ู",
"ุจ+ุชุชุนุจ",
"ููุณ+ู",
"ู+ุฌุงู",
"ุชุญูู
",
"ููู",
"ุ",
"EOS"
] | [
"NOUN",
"NOUN",
"V",
"V+PREP+PRON",
"PART",
"FUT_PART+V",
"V",
"NOUN",
"NOUN+NSUFF",
"PREP",
"DET+NOUN",
"PUNC",
"ADJ",
"NOUN+NSUFF+PRON",
"PROG_PART+V",
"NOUN+PRON",
"CONJ+ADJ",
"V",
"PART",
"PUNC",
"EOS"
] |
3 | "A" | [
"ูุจู",
"ู
ุง",
"ุชูุงู
",
"ุงุธุจุช",
"ู
ูุจู",
"ุงูู
ูุจุงูู",
"ุนูู",
"ู
ูุนุงุฏ",
"ุตูุงุฉ",
"ุงููุฌุฑ",
"ุนุดุงู",
"ูู",
"ู
ุตุญุชุด",
"ุชุงูู",
"ุงูููุฉ",
"ุชุดูุนูู",
"EOS"
] | [
"ูุจู",
"ู
ุง",
"ุชูุงู
",
"ุงุธุจุช",
"ู
ูุจู",
"ุงู+ู
ูุจุงูู",
"ุนูู",
"ู
ูุนุงุฏ",
"ุตูุง+ุฉ",
"ุงู+ูุฌุฑ",
"ุนุดุงู",
"ูู",
"ู
+ุตุญ+ุช+ุด",
"ุชุงูู",
"ุงู+ูู+ุฉ",
"ุชุดูุน+ู+ู",
"EOS"
] | [
"NOUN",
"PART",
"V",
"V",
"NOUN",
"DET+NOUN",
"PREP",
"NOUN",
"NOUN+NSUFF",
"DET+NOUN",
"PART",
"PART",
"PART+V+PRON+NEG_PART",
"ADJ",
"DET+NOUN+NSUFF",
"V+PREP+PRON",
"EOS"
] |
4 | "A" | [
"ุญุชู",
"ูู",
"ูุดูุช",
"ู",
"ุญุงุฌุฉ",
"ูุชุชุนูู
",
"ู
ููุง",
"ุจุฑุถู",
".",
"ุงูุง",
"ูู",
"ุงูุช",
"ุบุจู",
"EOS"
] | [
"ุญุชู",
"ูู",
"ูุดู+ุช",
"ู",
"ุญุงุฌ+ุฉ",
"ู+ุชุชุนูู
",
"ู
ู+ูุง",
"ุจุฑุถู",
".",
"ุงูุง",
"ูู",
"ุงูุช",
"ุบุจู",
"EOS"
] | [
"PART",
"PART",
"V+PRON",
"PREP",
"NOUN+NSUFF",
"FUT_PART+V",
"PREP+PRON",
"ADV",
"PUNC",
"PART",
"PART",
"PRON",
"ADJ",
"EOS"
] |
2 | "A" | [
"ูู",
"ูุงุฒู
",
"ุงููุงุญุฏ",
"ูู
ุง",
"ูุฌู",
"ููุงุธุจ",
"ุนูู",
"ุงูุฑูุงุถู",
"ูุฏู
ููุง",
"ููุง",
"ุงูุชูุง",
"ูุงุฎุฏููุง",
"ู
ูุถู",
"ููุง",
"ุงูู",
"ุ",
"#bassem",
"#hit",
"EOS"
] | [
"ูู",
"ูุงุฒู
",
"ุงู+ูุงุญุฏ",
"ูู
ุง",
"ูุฌู",
"ููุงุธุจ",
"ุนูู",
"ุงู+ุฑูุงุถ+ู",
"ูุฏู
ู+ูุง",
"ู+ูุง",
"ุงูุชูุง",
"ูุงุฎุฏ+ู+ูุง",
"ู
ูุถ+ู",
"ู+ูุง",
"ุงูู",
"ุ",
"#bassem",
"#hit",
"EOS"
] | [
"PRON",
"ADJ",
"DET+NOUN",
"PART",
"V",
"V",
"PREP",
"DET+NOUN+NSUFF",
"V+PRON",
"CONJ+PART",
"PRON",
"ADJ+NSUFF+PRON",
"NOUN+NSUFF",
"CONJ+PART",
"PART",
"PUNC",
"HASH",
"HASH",
"EOS"
] |
2 | "A" | [
"ุงููู",
"ูุดูููู",
"ูู",
"ุนุฒ",
"ูุฑุญู",
"ู
ูุนุฑูููุด",
"ููุช",
"ุฒุนูู",
".",
"EOS"
] | [
"ุงููู",
"ูุดูู+ูู",
"ูู",
"ุนุฒ",
"ูุฑุญ+ู",
"ู
+ูุนุฑู+ูู+ุด",
"ููุช",
"ุฒุนู+ู",
".",
"EOS"
] | [
"PART",
"V+PRON",
"PREP",
"NOUN",
"NOUN+PRON",
"PART+V+PRON+NEG_PART",
"NOUN",
"NOUN+PRON",
"PUNC",
"EOS"
] |
3 | "A" | [
"ุฏุขูู
ุข",
"#ุขูุดุฎุต",
"ุฅููู",
"ุจูุขุฎุฏ",
"ุจุขูู",
"ู
ู",
"ุขูุชูุขุตูู",
"ุขูุตุบูุฑู",
"ุจูุจูู",
"ุฃูุชุฑ",
"ุดุฎุต",
"ู
ููุฏ",
"ุฏุขูู
ุข",
"ุนูู",
"ููุณู",
"!",
"#ุญูููู",
"EOS"
] | [
"ุฏุขูู
+ุข",
"#ุขูุดุฎุต",
"ุฅููู",
"ุจ+ูุขุฎุฏ",
"ุจุขู+ู",
"ู
ู",
"ุขู+ุชูุขุตูู",
"ุขู+ุตุบูุฑ+ู",
"ุจ+ูุจูู",
"ุฃูุชุฑ",
"ุดุฎุต",
"ู
ููุฏ",
"ุฏุขูู
+ุข",
"ุนูู",
"ููุณ+ู",
"!",
"#ุญูููู",
"EOS"
] | [
"ADJ+CASE",
"HASH",
"PART",
"PROG_PART+V",
"NOUN+PRON",
"PREP",
"DET+NOUN",
"DET+ADJ+NSUFF",
"PROG_PART+V",
"ADJ",
"NOUN",
"ADJ",
"ADJ+CASE",
"PREP",
"NOUN+PRON",
"PUNC",
"HASH",
"EOS"
] |
4 | "A" | [
"(",
"2",
")",
"ุชูุฌู",
"ูุชููู
",
"ู",
"ูููู",
"ูุงู
",
"ูุตูุญุฉ",
"ุนูู",
"ูุงู
",
"ููู
ุฉ",
"ุญููุฉ",
"ุนูู",
"ุญุจุฉ",
"ุฃู",
"ููุงู
",
"ุนุดุงู",
"ูุงู
",
"ุฑูุชููุช",
"EOS"
] | [
"(",
"2",
")",
"ุชูุฌ+ู",
"ูุชููู
",
"ู",
"ูููู",
"ูุงู
",
"ูุตูุญ+ุฉ",
"ุนูู",
"ูุงู
",
"ููู
+ุฉ",
"ุญูู+ุฉ",
"ุนูู",
"ุญุจ+ุฉ",
"ุฃู",
"ููุงู
",
"ุนุดุงู",
"ูุงู
",
"ุฑูุชููุช",
"EOS"
] | [
"PUNC",
"NUM",
"PUNC",
"V+PRON",
"V",
"CONJ",
"V",
"NOUN",
"NOUN+NSUFF",
"PREP",
"NOUN",
"NOUN+NSUFF",
"ADJ+NSUFF",
"PREP",
"NOUN+NSUFF",
"NOUN",
"NOUN",
"PART",
"NOUN",
"NOUN",
"EOS"
] |
5 | "A" | [
"ูุงูุฑ",
"ุฃูุงู
",
"ูู
ุงุง",
"ููุช",
"ุชูู",
"ุน",
"ุงูุดุงุฑุน",
"ุชูุงูู",
"ูุงุญุฏู",
"ู
ุญุฌุจู",
"ููุงุญุฏ",
"ุตุงุญุจู",
"ูุนุงูุณูุง",
"ุชูููู",
"ุจุณ",
"ูุงุถ",
"ุฏู",
"ู
ุญุฌุจู",
"ุ",
"EOS"
] | [
"ูุงูุฑ",
"ุฃูุงู
",
"ูู
ุงุง",
"ูู+ุช",
"ุชูู",
"ุน",
"ุงู+ุดุงุฑุน",
"ุชูุงูู",
"ูุงุญุฏ+ู",
"ู
ุญุฌุจ+ู",
"ู+ูุงุญุฏ",
"ุตุงุญุจ+ู",
"ูุนุงูุณ+ูุง",
"ุชูู+ู+ู",
"ุจุณ",
"ูุง+ุถ",
"ุฏู",
"ู
ุญุฌุจ+ู",
"ุ",
"EOS"
] | [
"ADJ",
"NOUN",
"PART",
"V+PRON",
"V",
"PREP",
"DET+NOUN",
"V",
"NOUN+NSUFF",
"ADJ+NSUFF",
"CONJ+NOUN",
"NOUN+PRON",
"V+PRON",
"V+PREP+PRON",
"PART",
"PART+NOUN",
"PRON",
"ADJ+NSUFF",
"PUNC",
"EOS"
] |
2 | "A" | [
"ูู",
"ุฑูุนูุง",
"ูุถูุฉ",
"ุนูู",
"ุงูููุงู",
"ุงูุตููููู",
"ุจูููู",
"ุงููู
",
"ุฅุฑูุงุจููู",
"ู",
"ุจูุทุงูุจ",
"ุจูุทุน",
"ุฃู",
"ุนูุงูุฉ",
"ุจููู
",
"ูุชุชูุจู",
"ุงููุถูุฉ",
"ุจุฑุถู",
"ุฒู",
"ุญู
ุงุณ",
"ุ",
"ููุง",
"ููููู",
"ุนูุจ",
"ู
ุด",
"ุงุฎุชุตุงุตูุง",
"ุ",
"!",
"EOS"
] | [
"ูู",
"ุฑูุน+ูุง",
"ูุถู+ุฉ",
"ุนูู",
"ุงู+ููุงู",
"ุงู+ุตููููู",
"ุจ+ูููู",
"ุงู+ูู
",
"ุฅุฑูุงุจู+ูู",
"ู",
"ุจ+ูุทุงูุจ",
"ุจ+ูุทุน",
"ุฃู",
"ุนูุงู+ุฉ",
"ุจู+ูู
",
"ู+ุชุชูุจู",
"ุงู+ูุถู+ุฉ",
"ุจุฑุถู",
"ุฒู",
"ุญู
ุงุณ",
"ุ",
"ู+ูุง",
"ู+ูููู",
"ุนูุจ",
"ู
ุด",
"ุงุฎุชุตุงุต+ูุง",
"ุ",
"!",
"EOS"
] | [
"PART",
"V+PRON",
"NOUN+NSUFF",
"PREP",
"DET+NOUN",
"DET+ADJ",
"PROG_PART+V",
"PART+PRON",
"ADJ+NSUFF",
"CONJ",
"PROG_PART+V",
"PREP+NOUN",
"NOUN",
"NOUN+NSUFF",
"PREP+PRON",
"FUT_PART+V",
"DET+NOUN+NSUFF",
"ADV",
"NOUN",
"NOUN",
"PUNC",
"CONJ+PART",
"FUT_PART+V",
"NOUN",
"PART",
"NOUN+PRON",
"PUNC",
"PUNC",
"EOS"
] |
1 | "A" | [
"ุฏุงูู
ุง",
"ุงููุงุญุฏ",
"#ุจููุตุฑ",
"ูู",
"ุญู",
"ูุงุณ",
"#ุชุณุชุงูู",
"ููุณุฃู",
"ุนูู",
"#ูุงุณ",
"#ู
ุชุณุชููุด",
":-(",
"EOS"
] | [
"ุฏุงูู
+ุง",
"ุงู+ูุงุญุฏ",
"#ุจููุตุฑ",
"ูู",
"ุญู",
"ูุงุณ",
"#ุชุณุชุงูู",
"ู+ูุณุฃู",
"ุนูู",
"#ูุงุณ",
"#ู
ุชุณุชููุด",
":-(",
"EOS"
] | [
"ADJ+CASE",
"DET+NOUN",
"HASH",
"PREP",
"NOUN",
"NOUN",
"HASH",
"CONJ+V",
"PREP",
"HASH",
"NOUN",
"EMOT",
"EOS"
] |
4 | "A" | [
"ู
ูู",
"ุงูุช",
"ู
ุงุชุญุทููุด",
"ุฅู
ุชุญุงู",
"ุตุนุจ",
"ู",
"ุชูุฌู",
"ูู",
"ุงูุขุฎุฑ",
"ุชูููู",
"\"",
"Good",
"Luck",
"\"",
"ุนุดุงู",
"ู
ุงุชุฌูุจุด",
"ุงูุดุชูู
ู",
"ููู",
"ู",
"ููุณุช",
"ุงููุงูุฏู",
"EOS"
] | [
"ู
+ูู",
"ุงูุช",
"ู
ุง+ุชุญุท+ู+ู+ุด",
"ุฅู
ุชุญุงู",
"ุตุนุจ",
"ู",
"ุชูุฌู",
"ูู",
"ุงู+ุขุฎุฑ",
"ุชูู+ู+ู",
"\"",
"Good",
"Luck",
"\"",
"ุนุดุงู",
"ู
ุง+ุชุฌูุจ+ุด",
"ุงู+ุดุชูู
+ู",
"ูู+ู",
"ู",
"ู+ุงู+ุณุช",
"ุงู+ูุงูุฏ+ู",
"EOS"
] | [
"PART+PRON",
"PRON",
"PART+V+PREP+PRON+NEG_PART",
"NOUN",
"ADJ",
"CONJ",
"V",
"PREP",
"DET+ADJ",
"V+PREP+PRON",
"PUNC",
"FOREIGN",
"FOREIGN",
"PUNC",
"PART",
"PART+V+NEG_PART",
"DET+NOUN+NSUFF",
"PREP+PRON",
"CONJ",
"PREP+DET+NOUN",
"DET+NOUN+NSUFF",
"EOS"
] |
5 | "A" | [
"ูุงููู",
"ูุงู",
"ูู",
"ุดุบูู",
"ููุณู",
"ุฑุงุฌุน",
"ูุงููู",
"ูุงู",
"ูู",
"ู
ุฏุฑุณุชู",
"ูุงููู",
"ูุงูู",
"ูู",
"ุงูุจููููุฉ",
"ุจูุดุฑุจ",
"ุณูุฌุงุฑุฉ",
".",
".",
"ูุญุจ",
"ููููู",
"ุงู",
"ุงูุฒูู",
"ุฌุงุจ",
"ุฌูู",
".",
".",
".",
"http://t.co/SP1RsPjMxY",
"EOS"
] | [
"ู+ุงููู",
"ูุงู",
"ูู",
"ุดุบู+ู",
"ู+ูุณ+ู",
"ุฑุงุฌุน",
"ู+ุงููู",
"ูุงู",
"ูู",
"ู
ุฏุฑุณ+ุช+ู",
"ู+ุงููู",
"ูุงูู",
"ูู",
"ุงู+ุจูููู+ุฉ",
"ุจ+ูุดุฑุจ",
"ุณูุฌุงุฑ+ุฉ",
".",
".",
"ูุญุจ",
"ููู+ู+ู",
"ุงู",
"ุงูุฒูู",
"ุฌุงุจ",
"ุฌูู",
".",
".",
".",
"http://t.co/SP1RsPjMxY",
"EOS"
] | [
"CONJ+PART",
"V",
"PREP",
"NOUN+PRON",
"CONJ+ADV+NSUFF",
"ADJ",
"CONJ+PART",
"V",
"PREP",
"NOUN+NSUFF+PRON",
"CONJ+PART",
"ADJ",
"PREP",
"DET+NOUN+NSUFF",
"PROG_PART+V",
"NOUN+NSUFF",
"PUNC",
"PUNC",
"V",
"V+PREP+PRON",
"PART",
"NOUN",
"V",
"NOUN",
"PUNC",
"PUNC",
"PUNC",
"URL",
"EOS"
] |
2 | "A" | [
"ูุต",
"ุงูู๏ปปุฏ",
"ุงููู",
"ู",
"ุชููุชุฑ",
"ููู
ูู",
"ุงูุจูุช",
"ุนุงูุฒู",
"ุงูู",
".",
".",
"ู",
"ุจุชุญุจ",
"ุงูู",
"!",
"!",
"ุงูุง",
"ุจูู",
"ุงุดู",
"ุงู",
"ู",
"ุญุฏ",
"ุจูุนู
ู",
"ุจ",
"ุงููู",
"ุจูููููุง",
"ุฏู",
".",
".",
".",
"#ู๏ปปู
",
"ู
ู",
"ุบูุฑ",
"ูุนู",
"EOS"
] | [
"ูุต",
"ุงู+ููุงุฏ",
"ุงููู",
"ู",
"ุชููุชุฑ",
"ููู
+ูู",
"ุงู+ุจูุช",
"ุนุงูุฒ+ู",
"ุงูู",
".",
".",
"ู",
"ุจ+ุชุญุจ",
"ุงูู",
"!",
"!",
"ุงูุง",
"ุจูู",
"ุงุดู",
"ุงู",
"ู",
"ุญุฏ",
"ุจ+ูุนู
ู",
"ุจ",
"ุงููู",
"ุจ+ูููู+ูุง",
"ุฏู",
".",
".",
".",
"#ู๏ปปู
",
"ู
ู",
"ุบูุฑ",
"ูุนู",
"EOS"
] | [
"NOUN",
"DET+NOUN",
"PART",
"PREP",
"NOUN",
"ADJ+NSUFF",
"DET+NOUN",
"ADJ+NSUFF",
"PART",
"PUNC",
"PUNC",
"CONJ",
"PROG_PART+V",
"PART",
"PUNC",
"PUNC",
"PRON",
"ADV",
"V",
"PART",
"PREP",
"NOUN",
"PROG_PART+V",
"PREP",
"PART",
"PROG_PART+V+PRON",
"PRON",
"PUNC",
"PUNC",
"PUNC",
"HASH",
"PREP",
"NOUN",
"NOUN",
"EOS"
] |
5 | "A" | [
"ู
ุด",
"ูู",
"ุญุงุฌู",
"ุชุนู
ููุง",
"ุชููู",
"ุงูู",
"ุฑุงุฌู",
"ู",
"ุจุฑุงุญุชู",
".",
".",
"#ูู
ุง",
"ุชู
ูุช",
"ู
ุด",
"ูุชููู",
"ุงุตู",
"ููุช",
"ุฑุงุฌู",
"ููุงู",
"ุจุฑุงุญุชู",
"#ู
ููุด",
"ุชูุฑูู",
"ููุงู",
"ูุง",
"ุตุงุญุจู",
"!",
"EOS"
] | [
"ู
ุด",
"ูู",
"ุญุงุฌ+ู",
"ุชุนู
ู+ูุง",
"ุชููู",
"ุงู+ู",
"ุฑุงุฌู",
"ู",
"ุจ+ุฑุงุญ+ุช+ู",
".",
".",
"#ูู
ุง",
"ุชู
ูุช",
"ู
ุด",
"ู+ุชููู",
"ุงุตู",
"ูู+ุช",
"ุฑุงุฌู",
"ู+ูุงู",
"ุจ+ุฑุงุญ+ุช+ู",
"#ู
ููุด",
"ุชูุฑู+ู",
"ููุงู",
"ูุง",
"ุตุงุญุจ+ู",
"!",
"EOS"
] | [
"PART",
"NOUN",
"NOUN+NSUFF",
"V+PRON",
"V",
"PART+PRON",
"NOUN",
"CONJ",
"PREP+NOUN+NSUFF+PRON",
"PUNC",
"PUNC",
"HASH",
"V",
"PART",
"FUT_PART+V",
"NOUN",
"V+PRON",
"NOUN",
"CONJ+V",
"PREP+NOUN+NSUFF+PRON",
"HASH",
"NOUN+NSUFF",
"ADV",
"PART",
"NOUN+NSUFF",
"PUNC",
"EOS"
] |
4 | "A" | [
"ุงูู",
"ุชุจูู",
"ูุงุทู",
"ุฏู",
"ุญุงุฌู",
"ุณููู",
"ุงูู",
".",
".",
"ุจุณ",
"ุงูู",
"ุชุจูู",
"ุฑุงุฌู",
"ุฏู",
"ุนุงูุฒู",
"ู
ุฌููุฏ",
"ุดููู",
":)",
"EOS"
] | [
"ุงู+ู",
"ุชุจูู",
"ูุงุทู",
"ุฏู",
"ุญุงุฌ+ู",
"ุณูู+ู",
"ุงูู",
".",
".",
"ุจุณ",
"ุงู+ู",
"ุชุจูู",
"ุฑุงุฌู",
"ุฏู",
"ุนุงูุฒ+ู",
"ู
ุฌููุฏ",
"ุดูู+ู",
":)",
"EOS"
] | [
"PART+PRON",
"V",
"ADJ",
"PRON",
"NOUN+NSUFF",
"ADJ+NSUFF",
"ADJ",
"PUNC",
"PUNC",
"PART",
"PART+PRON",
"V",
"NOUN",
"PRON",
"ADJ+NSUFF",
"NOUN",
"NOUN+NSUFF",
"EMOT",
"EOS"
] |
2 | "A" | [
"ููู",
"ุงููุงุณ",
"ุจุชููู",
"ูุฃู",
"ุญุฏ",
"ูู",
"ุงูุดุงุฑุน",
"ูุงุจุดู
ููุฏุณ",
"ุ",
"ู
ุง",
"ุนุฏุง",
"ุงูู
ููุฏุณ",
"ูุนูุงู",
"ุจูููููุง",
"ูุงุฏูุชูุฑ",
"!",
"EOS"
] | [
"ููู",
"ุงู+ูุงุณ",
"ุจ+ุชููู",
"ู+ุฃู",
"ุญุฏ",
"ูู",
"ุงู+ุดุงุฑุน",
"ูุง+ุจุดู
ููุฏุณ",
"ุ",
"ู
ุง",
"ุนุฏุง",
"ุงู+ู
ููุฏุณ",
"ูุนู+ุง",
"ุจ+ูููู+ูุง",
"ูุง+ุฏูุชูุฑ",
"!",
"EOS"
] | [
"PART",
"DET+NOUN",
"PROG_PART+V",
"PREP+NOUN",
"NOUN",
"PREP",
"DET+NOUN",
"PART+NOUN",
"PUNC",
"PART",
"V",
"DET+NOUN",
"NOUN+CASE",
"PROG_PART+V+PRON",
"PART+NOUN",
"PUNC",
"EOS"
] |
3 | "A" | [
"ุฌุฉ",
"ุงูุฒู
ู",
"ุงููู",
"ุงููุงุณ",
"ุชุนู
ู",
"ุฌู
ุงูู",
"ูุจุนุถ",
"ุ",
"ุ",
"ุนุดุงู",
"ุชููุฑ",
"ุจุนุถ",
"ุจูุฉ",
".",
"EOS"
] | [
"ุฌุฉ",
"ุงู+ุฒู
ู",
"ุงููู",
"ุงู+ูุงุณ",
"ุชุนู
ู",
"ุฌู
ุงูู",
"ู+ุจุนุถ",
"ุ",
"ุ",
"ุนุดุงู",
"ุชููุฑ",
"ุจุนุถ",
"ุจู+ุฉ",
".",
"EOS"
] | [
"V",
"DET+NOUN",
"PART",
"DET+NOUN",
"V",
"NOUN",
"PREP+NOUN",
"PUNC",
"PUNC",
"PART",
"V",
"NOUN",
"PREP+PRON",
"PUNC",
"EOS"
] |
1 | "A" | [
"ุงูุง",
"ูุฑุจุช",
"ุงุชุฌูู",
"!",
"ุงูุง",
"ุจุญูู
",
"ุญุงุฌุงุช",
"ุจุชุชุญูู",
":(",
"ูุจููุฑ",
"ูู",
"ุญุงุฌุงุช",
"ู",
"ุฎูุงูู",
"ุจุฑุฏู",
"ุจุชุชุญูู",
"ู",
"ููุณ",
"ุงูููู
",
"!",
"ุงูุง",
"ุฎุงููู",
"-_-",
"EOS"
] | [
"ุงูุง",
"ูุฑุจ+ุช",
"ุงุชุฌูู",
"!",
"ุงูุง",
"ุจ+ุญูู
",
"ุญุงุฌ+ุงุช",
"ุจ+ุชุชุญูู",
":(",
"ู+ุจ+ููุฑ",
"ูู",
"ุญุงุฌ+ุงุช",
"ู",
"ุฎูุงู+ู",
"ุจุฑุฏู",
"ุจ+ุชุชุญูู",
"ู",
"ููุณ",
"ุงู+ููู
",
"!",
"ุงูุง",
"ุฎุงูู+ู",
"-_-",
"EOS"
] | [
"PRON",
"V+PRON",
"V",
"PUNC",
"PRON",
"PROG_PART+V",
"NOUN+NSUFF",
"PROG_PART+V",
"EMOT",
"CONJ+PROG_PART+V",
"PREP",
"NOUN+NSUFF",
"PREP",
"NOUN+PRON",
"ADV",
"PROG_PART+V",
"PREP",
"NOUN",
"DET+NOUN",
"PUNC",
"PRON",
"ADJ+NSUFF",
"EMOT",
"EOS"
] |
2 | "A" | [
"ุฃูุง",
"ู
ุด",
"ุณุงู
ุน",
"ูุต",
"ููุงู
",
"ุงููู",
"ุจูููู
ููู",
"ุ",
"ุจุณุจุจ",
"ุฏูุฑ",
"ุงูุจุฑุฏ",
"ุงููู",
"ุนูุฏู",
"ุ",
"ุจูุฒ",
"ุฏู
ุงุบู",
"ุฒู",
"ุงูุนุจูุท",
"ูุฃูู",
"ุณุงู
ุน",
"EOS"
] | [
"ุฃูุง",
"ู
ุด",
"ุณุงู
ุน",
"ูุต",
"ููุงู
",
"ุงููู",
"ุจ+ูููู
+ู+ูู",
"ุ",
"ุจ+ุณุจุจ",
"ุฏูุฑ",
"ุงู+ุจุฑุฏ",
"ุงููู",
"ุนูุฏ+ู",
"ุ",
"ุจ+ูุฒ",
"ุฏู
ุงุบ+ู",
"ุฒู",
"ุงู+ุนุจูุท",
"ูุฃู+ู",
"ุณุงู
ุน",
"EOS"
] | [
"PRON",
"PART",
"ADJ",
"NOUN",
"NOUN",
"PART",
"PROG_PART+V+PRON+PRON",
"PUNC",
"PREP+NOUN",
"NOUN",
"DET+NOUN",
"PART",
"NOUN+PRON",
"PUNC",
"PROG_PART+V",
"NOUN+PRON",
"NOUN",
"DET+ADJ",
"PART+PRON",
"ADJ",
"EOS"
] |
2 | "A" | [
"ุงููุงุณ",
"ู
ุด",
"ูุฏุฑุฉ",
"ุชููู
",
"ุฃู",
"ู
ููุด",
"ุญุงุฌุฉ",
"ุงุณู
ูุง",
"ุญุจ",
"ููุง",
"ูู",
"ุญุฏ",
"ุจูุญุจ",
"ุจุฌุฏ",
"ูุงูู",
"ุจุชุญุจู",
"ุจุฌุฏ",
"ุจูุณูุจู",
"ูุงูู",
"ุจูุญุจู",
"ุจุฌุฏ",
"ุจุชุณูุจู",
"ูุง",
"ุฑูุญ",
"ุจุงูู",
"ุฃุญุณู",
".",
"EOS"
] | [
"ุงู+ูุงุณ",
"ู
ุด",
"ูุฏุฑ+ุฉ",
"ุชููู
",
"ุฃู",
"ู
+ูู+ุด",
"ุญุงุฌ+ุฉ",
"ุงุณู
+ูุง",
"ุญุจ",
"ู+ูุง",
"ูู",
"ุญุฏ",
"ุจ+ูุญุจ",
"ุจ+ุฌุฏ",
"ู+ุงูู",
"ุจ+ุชุญุจ+ู",
"ุจ+ุฌุฏ",
"ุจ+ูุณูุจ+ู",
"ู+ุงูู",
"ุจ+ูุญุจ+ู",
"ุจ+ุฌุฏ",
"ุจ+ุชุณูุจ+ู",
"ูุง",
"ุฑูุญ",
"ุจุงู+ู",
"ุฃุญุณู",
".",
"EOS"
] | [
"DET+NOUN",
"PART",
"ADJ+NSUFF",
"V",
"PART",
"PART+PREP+NEG_PART",
"NOUN+NSUFF",
"NOUN+PRON",
"NOUN",
"CONJ+PART",
"PREP",
"NOUN",
"PROG_PART+V",
"PREP+NOUN",
"CONJ+PART",
"PROG_PART+V+PRON",
"PREP+NOUN",
"PROG_PART+V+PRON",
"CONJ+PART",
"PROG_PART+V+PRON",
"PREP+NOUN",
"PROG_PART+V+PRON",
"CONJ",
"V",
"NOUN+PRON",
"ADJ",
"PUNC",
"EOS"
] |
2 | "A" | [
"ููู",
"ูุงุณ",
"ูุฏู",
"ุจูุจูู",
"ุทูู",
"ุนูู
ุฑูู
",
"ู
ุนุฑูููู",
"ุจุฅุณู
ูู
",
"ูุฅุณู
",
"ุฃุจููู
",
"ููุฌุฃุฉ",
"ูุฏู",
"ุณูุจุญุงู",
"ุงููู",
"ุจูุทูุนููู
",
"ุฅุณู
",
"ุนููุฉ",
"ุฑููุด",
"ูููุถููุง",
"ููุฑููุง",
"ุงููู",
"ุฎูููููุง",
"ุจูู",
"EOS"
] | [
"ูู+ู",
"ูุงุณ",
"ูุฏู",
"ุจ+ูุจูู",
"ุทูู",
"ุนู
ุฑ+ูู
",
"ู
ุนุฑูู+ูู",
"ุจ+ุฅุณู
+ูู
",
"ู+ุฅุณู
",
"ุฃุจ+ู+ูู
",
"ู+ูุฌุฃ+ุฉ",
"ูุฏู",
"ุณุจุญุงู",
"ุงููู",
"ุจ+ูุทูุน+ู+ูู
",
"ุฅุณู
",
"ุนูู+ุฉ",
"ุฑูุด",
"ู+ููุถู+ูุง",
"ููุฑู+ูุง",
"ุงููู",
"ุฎูู+ู+ูุง",
"ุจู+ู",
"EOS"
] | [
"PREP+PRON",
"NOUN",
"ADV",
"PROG_PART+V",
"NOUN",
"NOUN+PRON",
"ADJ+NSUFF",
"PREP+NOUN+PRON",
"CONJ+NOUN",
"NOUN+CASE+PRON",
"CONJ+NOUN+NSUFF",
"ADV",
"NOUN",
"NOUN",
"PROG_PART+V+PREP+PRON",
"NOUN",
"NOUN+NSUFF",
"ADJ",
"CONJ+V+PRON",
"V+PRON",
"PART",
"V+PRON+PRON",
"PREP+PRON",
"EOS"
] |
4 | "A" | [
"ูู",
"ูู
ุง",
"ููุฏ",
"ูุจูุน",
"ุตุงุญุจู",
"ุนุดุงู",
"ุจูุช",
"ุจููููู",
"ู
ุด",
"ุฑุงุฌู",
"ุทูุจ",
"ู",
"ุงูุจูุช",
"ุงููู",
"ุจุชุจูุน",
"ุตุงุญุจุชูุง",
"ุนุดุงู",
"ููุฏ",
"ูุชูุงู",
"ุนูููุง",
"ุงูู",
"ุ",
"!",
"EOS"
] | [
"ูู",
"ูู
ุง",
"ููุฏ",
"ูุจูุน",
"ุตุงุญุจ+ู",
"ุนุดุงู",
"ุจูุช",
"ุจ+ูููู+ู",
"ู
ุด",
"ุฑุงุฌู",
"ุทูุจ",
"ู",
"ุงู+ุจูุช",
"ุงููู",
"ุจ+ุชุจูุน",
"ุตุงุญุจ+ุช+ูุง",
"ุนุดุงู",
"ููุฏ",
"ูุชูุงู",
"ุนูู+ูุง",
"ุงูู",
"ุ",
"!",
"EOS"
] | [
"PRON",
"PART",
"NOUN",
"V",
"NOUN+PRON",
"PART",
"NOUN",
"PROG_PART+V+PRON",
"PART",
"NOUN",
"ADJ",
"CONJ",
"DET+NOUN",
"PART",
"PROG_PART+V",
"NOUN+NSUFF+PRON",
"PART",
"NOUN",
"V",
"PREP+PRON",
"PART",
"PUNC",
"PUNC",
"EOS"
] |
4 | "A" | [
"ุนู
ุฑู",
"ูุณู",
"ู
ุฎุจู",
"ุญุงุฌุงุช",
"ุงูุชุฑ",
"ู
ู",
"ูุฏู",
"ู
ุณุชููุงู",
"ูุฑุจู",
"ุงููุฏ",
"ุดุงููู",
"ุฎูุฑ",
"ููุฌู",
"ูู",
"ููุชู",
"ูุงูุฏููุง",
"ุงููุฏ",
"ูููุง",
"ูุญุธุงุช",
"ุญููู",
"ูุชุนูุดูุง",
"ุ",
"ุจุณ",
"ููู",
"ูู",
"ููุชู",
".",
".",
"ุงุตุจุฑ",
"EOS"
] | [
"ุนู
ุฑ+ู",
"ูุณ+ู",
"ู
ุฎุจู",
"ุญุงุฌ+ุงุช",
"ุงูุชุฑ",
"ู
ู",
"ูุฏู",
"ู
ุณุชูู+ุง+ู",
"ู+ุฑุจ+ู",
"ุงููุฏ",
"ุดุงู+ู+ู",
"ุฎูุฑ",
"ู+ูุฌู",
"ูู",
"ููุช+ู",
"ู+ุงู+ุฏููุง",
"ุงููุฏ",
"ูู+ูุง",
"ูุญุธ+ุงุช",
"ุญูู+ู",
"ู+ุชุนูุด+ูุง",
"ุ",
"ุจุณ",
"ูู+ู",
"ูู",
"ููุช+ู",
".",
".",
"ุงุตุจุฑ",
"EOS"
] | [
"NOUN+PRON",
"ADV+NSUFF",
"ADJ",
"NOUN+NSUFF",
"ADJ",
"PREP",
"ADV",
"ADJ+NSUFF+PRON",
"CONJ+NOUN+PRON",
"ADJ",
"ADJ+PREP+PRON",
"NOUN",
"FUT_PART+V",
"PREP",
"NOUN+PRON",
"CONJ+DET+NOUN",
"ADJ",
"PREP+PRON",
"NOUN+NSUFF",
"ADJ+NSUFF",
"FUT_PART+V+PRON",
"PUNC",
"PART",
"NOUN+PRON",
"PREP",
"NOUN+PRON",
"PUNC",
"PUNC",
"V",
"EOS"
] |
2 | "A" | [
"ุฃุตู",
"ูู",
"ูุงุณ",
"ู
ุงุจุชุญุจุด",
"ุงูุชุฌุฏูุฏ",
".",
".",
"ุงูู",
"ุจูุชููู",
"ู
ู",
"ุงููุฑุจุงุฌ",
"ู
ู",
"ุฒู
ุงู",
".",
".",
"ุตุนุจ",
"ุงูู",
"ูุฌูู",
"ุนูู",
"ูุจุฑ",
".",
".",
"ูุบูุฑูุง",
"!",
"!",
"#ุญูููุฉ",
"#ุจุงุณู
_ููุณู",
"#ุฑุฌุนูุง_ุฌู
ุงููุฑ",
"EOS"
] | [
"ุฃุตู",
"ูู",
"ูุงุณ",
"ู
ุง+ุจ+ุชุญุจ+ุด",
"ุงู+ุชุฌุฏูุฏ",
".",
".",
"ุงูู",
"ุจ+ูุชููู",
"ู
ู",
"ุงู+ูุฑุจุงุฌ",
"ู
ู",
"ุฒู
ุงู",
".",
".",
"ุตุนุจ",
"ุงูู",
"ูุฌูู",
"ุนูู",
"ูุจุฑ",
".",
".",
"ูุบูุฑ+ูุง",
"!",
"!",
"#ุญูููุฉ",
"#ุจุงุณู
_ููุณู",
"#ุฑุฌุนูุง_ุฌู
ุงููุฑ",
"EOS"
] | [
"NOUN",
"PREP",
"NOUN",
"PART+PROG_PART+V+NEG_PART",
"DET+NOUN",
"PUNC",
"PUNC",
"PART",
"PROG_PART+V",
"PREP",
"DET+NOUN",
"PREP",
"NOUN",
"PUNC",
"PUNC",
"ADJ",
"ADJ",
"V",
"PREP",
"NOUN",
"PUNC",
"PUNC",
"V+PRON",
"PUNC",
"PUNC",
"HASH",
"HASH",
"HASH",
"EOS"
] |
2 | "A" | [
"ู
ุด",
"ุงู",
"ุญุฏ",
"ุจูุนุงู
ูู",
"ุญูู",
"ูุจูู",
"ุจูุญุจู",
"\"",
"ุงูู
ุตูุญุฉ",
"ุจุชุนู
ู",
"ูู",
"ุญุงุฌุฉ",
"\"",
"EOS"
] | [
"ู
ุด",
"ุงู",
"ุญุฏ",
"ุจ+ูุนุงู
ู+ู",
"ุญูู",
"ูุจูู",
"ุจ+ูุญุจ+ู",
"\"",
"ุงู+ู
ุตูุญ+ุฉ",
"ุจ+ุชุนู
ู",
"ูู",
"ุญุงุฌ+ุฉ",
"\"",
"EOS"
] | [
"PART",
"NOUN",
"NOUN",
"PROG_PART+V+PRON",
"ADJ",
"V",
"PROG_PART+V+PRON",
"PUNC",
"DET+NOUN+NSUFF",
"PROG_PART+V",
"NOUN",
"NOUN+NSUFF",
"PUNC",
"EOS"
] |
4 | "A" | [
"ู",
"ูู
ุง",
"ุชูุฌู",
"ุชูุงูุด",
"ุญุฏ",
"ู
ู",
"ุงูุฌูู",
"ุจุชุงุน",
"ุงูุนูุงุฌูุฒ",
"ูููููู",
"ู
ุด",
"ุงููู",
"ุจูุชูุจุถ",
"ุนูููู
",
"ุฏููู",
"ุจููุฑุฌ",
"ุนููู
",
"ูู",
"ู
ุธููู
",
"ููุทูุน",
"ูุงุจูู",
"ู
ุชุฎูุด",
"(",
"1",
")",
"EOS"
] | [
"ู",
"ูู
ุง",
"ุชูุฌู",
"ุชูุงูุด",
"ุญุฏ",
"ู
ู",
"ุงู+ุฌูู",
"ุจุชุงุน",
"ุงู+ุนูุงุฌูุฒ",
"ู+ููู+ู+ู",
"ู
ุด",
"ุงููู",
"ุจ+ูุชูุจุถ",
"ุนูู+ูู
",
"ุฏููู",
"ุจ+ููุฑุฌ",
"ุนู+ูู
",
"ูู",
"ู
ุธููู
",
"ู+ูุทูุน",
"ูุง+ุจู+ู",
"ู
+ุชุฎู+ุด",
"(",
"1",
")",
"EOS"
] | [
"CONJ",
"PART",
"V",
"V",
"NOUN",
"PREP",
"DET+NOUN",
"NOUN",
"DET+NOUN",
"FUT_PART+V+PREP+PRON",
"PART",
"PART",
"PROG_PART+V",
"PREP+PRON",
"PRON",
"PROG_PART+V",
"PREP+PRON",
"PART",
"ADJ",
"FUT_PART+V",
"PART+NOUN+PRON",
"PART+V+NEG_PART",
"PUNC",
"NUM",
"PUNC",
"EOS"
] |
1 | "A" | [
"ู",
"ูู
ุง",
"ูู",
"ู
ุธููู
",
"ุจูุชูุจุถ",
"ุนููู",
"ู
ู",
"ุงูุงูู",
"ูููู",
"ูุนูู",
"ุงูู",
"ุดุงุจ",
"ุงุจู",
"ูุงุณ",
"ู",
"ู
ุงููุด",
"ุฏุนูู",
"ุจุญุงุฌู",
"ูุชูุจุถ",
"ุนููู",
"ู",
"ูุฏุฎู",
"ุงูู
ุนุชูู",
"ูุนูู",
"ุงูู",
"ู
ุนุฏุด",
"ุญุฏ",
"ุจูู",
"ุจููุทู",
"(",
"2",
")",
"EOS"
] | [
"ู",
"ูู
ุง",
"ูู",
"ู
ุธููู
",
"ุจ+ูุชูุจุถ",
"ุนูู+ู",
"ู
ู",
"ุงู+ุงูู",
"ูููู",
"ูุนูู",
"ุงูู",
"ุดุงุจ",
"ุงุจู",
"ูุงุณ",
"ู",
"ู
ุง+ู+ู+ุด",
"ุฏุนู+ู",
"ุจ+ุญุงุฌ+ู",
"ูุชูุจุถ",
"ุนูู+ู",
"ู",
"ูุฏุฎู",
"ุงู+ู
ุนุชูู",
"ูุนูู",
"ุงูู",
"ู
+ุนุฏ+ุด",
"ุญุฏ",
"ุจูู",
"ุจ+ููุทู",
"(",
"2",
")",
"EOS"
] | [
"CONJ",
"PART",
"PRON",
"ADJ",
"PROG_PART+V",
"PREP+PRON",
"PREP",
"DET+NUM",
"PART",
"V",
"PART",
"NOUN",
"NOUN",
"NOUN",
"CONJ",
"PART+PREP+PRON+NEG_PART",
"NOUN+NSUFF",
"PREP+NOUN+NSUFF",
"V",
"PREP+PRON",
"CONJ",
"V",
"DET+NOUN",
"V",
"PART",
"PART+V+NEG_PART",
"NOUN",
"V",
"PROG_PART+V",
"PUNC",
"NUM",
"PUNC",
"EOS"
] |
2 | "A" | [
"ูู
ุง",
"ุฑูุญูุง",
"ุงูู
ูุชู
ุฑ",
"ุนุดุงู",
"ุตุญุงุจูุง",
".",
".",
"ุญุถุฑุงุช",
"ุงููุดุทุงุก",
"ูุงูู
ุญุงู
ููู",
"ู
ุงุฑุถููุด",
"ูุชููู
ู",
"ุนู",
"ู
ุนุชููู",
"ุงูู
ุนุงุฏู",
"ุนุดุงู",
"ูู
ุง",
"ู
ุฌููููู",
"ูู
ุด",
"ู
ุดููุฑูู",
"ูู
ุงูููู
ุด",
"ุถูุฑ",
"#ูุชุจุน",
"EOS"
] | [
"ูู
ุง",
"ุฑูุญ+ูุง",
"ุงู+ู
ูุชู
ุฑ",
"ุนุดุงู",
"ุตุญุงุจ+ูุง",
".",
".",
"ุญุถุฑ+ุงุช",
"ุงู+ูุดุทุงุก",
"ู+ุงู+ู
ุญุงู
ู+ูู",
"ู
ุง+ุฑุถู+ู+ุด",
"ูุชููู
+ู",
"ุนู",
"ู
ุนุชูู+ู",
"ุงู+ู
ุนุงุฏู",
"ุนุดุงู",
"ูู
ุง",
"ู
ุฌููู+ูู",
"ู+ู
ุด",
"ู
ุดููุฑ+ูู",
"ู+ู
ุง+ู+ููู
+ุด",
"ุถูุฑ",
"#ูุชุจุน",
"EOS"
] | [
"PART",
"V+PRON",
"DET+NOUN",
"PART",
"NOUN+PRON",
"PUNC",
"PUNC",
"NOUN+NSUFF",
"DET+NOUN",
"CONJ+DET+NOUN+NSUFF",
"PART+V+PRON+NEG_PART",
"V+PRON",
"PREP",
"NOUN+NSUFF",
"DET+NOUN",
"PART",
"PRON",
"ADJ+NSUFF",
"CONJ+PART",
"ADJ+NSUFF",
"CONJ+PART+PREP+PRON+NEG_PART",
"NOUN",
"HASH",
"EOS"
] |
1 | "A" | [
"ุงูููุงู
",
"ูู",
"ูุงู",
"ูุนุจุฑ",
"ุนู",
"ุงูุญูุงู",
"ููุช",
"ูููุช",
"ุงูู",
"ู
ุด",
"ุทุงููุฉ",
"ูุด",
"ุงู
ู",
"ู
ู",
"ุฒู
ุงู",
"EOS"
] | [
"ุงู+ููุงู
",
"ูู",
"ูุงู",
"ูุนุจุฑ",
"ุนู",
"ุงู+ุญูุงู",
"ูู+ุช",
"ููู+ุช",
"ุงู+ู",
"ู
ุด",
"ุทุงูู+ุฉ",
"ูุด",
"ุงู
+ู",
"ู
ู",
"ุฒู
ุงู",
"EOS"
] | [
"DET+NOUN",
"PART",
"V",
"V",
"PREP",
"DET+NOUN",
"V+PRON",
"V+PRON",
"PART+PRON",
"PART",
"ADJ+NSUFF",
"NOUN",
"NOUN+PRON",
"PREP",
"NOUN",
"EOS"
] |
2 | "A" | [
"ุงูููุช",
"ููุนูุฏู",
"ุนูู",
"ุญุงุฌุงุช",
"ูุชูุฑ",
"ู
ุชุฎููุชุด",
"ุงุจุฏุง",
"ุงูู",
"ุชุชุนูุฏ",
"ุนูููุง",
".",
".",
".",
".",
"ุจุณ",
"ู
ุด",
"ูููุฏุฑ",
"ููุณููุงูู",
"EOS"
] | [
"ุงู+ููุช",
"ู+ูุนูุฏ+ู",
"ุนูู",
"ุญุงุฌ+ุงุช",
"ูุชูุฑ",
"ู
+ุชุฎูู+ุช+ุด",
"ุงุจุฏ+ุง",
"ุงู+ู",
"ุชุชุนูุฏ",
"ุนูู+ูุง",
".",
".",
".",
".",
"ุจุณ",
"ู
ุด",
"ู+ููุฏุฑ",
"ููุณู+ูุง+ู+ู",
"EOS"
] | [
"DET+NOUN",
"FUT_PART+V+PRON",
"PREP",
"NOUN+NSUFF",
"ADJ",
"PART+V+PRON+NEG_PART",
"NOUN+CASE",
"PART+PRON",
"V",
"PREP+PRON",
"PUNC",
"PUNC",
"PUNC",
"PUNC",
"PART",
"PART",
"FUT_PART+V",
"V+PRON+PREP+PRON",
"EOS"
] |
4 | "B" | [
"ูู",
"ุฃูุณุงู",
"ุฌูุงู",
"ุญูุงูุฉ",
"ุฃู",
"ุณุจุจ",
"ุจูุชุญูู
ูุง",
"ูู",
"ุฃุณููุจ",
"ุญูุงุชู",
"ูุทุฑููุชู",
"ุ",
"ูุง",
"ู
ุงุชุญูู
ุด",
"ุนูู",
"ุญุฏ",
"ู
ู",
"ุงูุธุงูุฑ",
".",
".",
"ุญูู",
"ูุฃููู
",
"ุงูุฃุณุจุงุจ",
"ุณุงุนุชูุง",
"ู
ู
ูู",
"ุชูุงูู",
"ูู",
"ู
ูููู",
"ุนุฐุฑ",
".",
"EOS"
] | [
"ูู",
"ุฃูุณุงู",
"ุฌู+ุง+ู",
"ุญูุงู+ุฉ",
"ุฃู",
"ุณุจุจ",
"ุจ+ูุชุญูู
+ูุง",
"ูู",
"ุฃุณููุจ",
"ุญูุง+ุช+ู",
"ู+ุทุฑูู+ุช+ู",
"ุ",
"ูุง",
"ู
ุง+ุชุญูู
+ุด",
"ุนูู",
"ุญุฏ",
"ู
ู",
"ุงู+ุธุงูุฑ",
".",
".",
"ุญูู",
"ู+ุฃููู
",
"ุงู+ุฃุณุจุงุจ",
"ุณุงุน+ุช+ูุง",
"ู
ู
ูู",
"ุชูุงูู",
"ู+ู",
"ู
ูููู",
"ุนุฐุฑ",
".",
"EOS"
] | [
"NOUN",
"NOUN",
"NOUN+NSUFF+PRON",
"NOUN+NSUFF",
"CONJ",
"NOUN",
"PROG_PART+V+PRON",
"PREP",
"NOUN",
"NOUN+NSUFF+PRON",
"CONJ+NOUN+NSUFF+PRON",
"PUNC",
"CONJ",
"PART+V+NEG_PART",
"PREP",
"NOUN",
"PREP",
"DET+ADJ",
"PUNC",
"PUNC",
"V",
"CONJ+V",
"DET+NOUN",
"NOUN+NSUFF+PRON",
"ADJ",
"V",
"PREP+PRON",
"NUM",
"NOUN",
"PUNC",
"EOS"
] |
4 | "B" | [
"ุณุงุนุงุช",
"ูุชูุฑ",
"ู
ุจุชุจูุงุด",
"ุนุงุฑู",
"ุฃูุช",
"ุจุชุญุณ",
"ุฅูู",
"ูุงุญูุชูู
",
"ููุง",
"ูู
ุง",
"ุจุงููุณุจุงูู",
"ุฅูู",
"ุ",
"ุ",
"ุ",
"ุจุณ",
"ุจุชุญุจ",
"ุชุชููู
",
"ู
ุนุงูู
",
"ูู",
"ููู
",
"EOS"
] | [
"ุณุงุน+ุงุช",
"ูุชูุฑ",
"ู
+ุจ+ุชุจูุง+ุด",
"ุนุงุฑู",
"ุฃูุช",
"ุจ+ุชุญุณ",
"ุฅูู",
"ูุงุญู+ุช+ูู
",
"ู+ูุง",
"ูู
ุง",
"ุจ+ุงู+ูุณุจ+ุง+ู+ู",
"ุฅูู",
"ุ",
"ุ",
"ุ",
"ุจุณ",
"ุจ+ุชุญุจ",
"ุชุชููู
",
"ู
ุนุง+ูู
",
"ูู",
"ููู
",
"EOS"
] | [
"NOUN+NSUFF",
"ADJ",
"PART+PROG_PART+V+NEG_PART",
"ADJ",
"PRON",
"PROG_PART+V",
"PART",
"NOUN+NSUFF+PRON",
"CONJ+PART",
"PRON",
"PREP+DET+NOUN+NSUFF+PREP+PRON",
"PART",
"PUNC",
"PUNC",
"PUNC",
"PART",
"PROG_PART+V",
"V",
"NOUN+PRON",
"NOUN",
"NOUN",
"EOS"
] |
3 | "B" | [
"ูู",
"ุนุดุงู",
"ู
ุด",
"ุจุณุงู",
"ูุจูู",
"ู
ุด",
"ู
ูุชู
ุฉ",
"ู
ุด",
"ู
ู
ูู",
"ูุนูู",
"ุงููู",
"ู
ุด",
"ุนุงุฑูุฉ",
"ุงุชุงููู
",
"ุนู",
"ุฌู",
"ุฏู",
"ุงู",
"ู
ุด",
"ุนุงูุฒุฉ",
"ูุชุนุงู
ู",
"ูุฏุฉ",
"EOS"
] | [
"ูู",
"ุนุดุงู",
"ู
ุด",
"ุจ+ุณุงู",
"ูุจูู",
"ู
ุด",
"ู
ูุชู
+ุฉ",
"ู
ุด",
"ู
ู
ูู",
"ูุนูู",
"ุงููู",
"ู
ุด",
"ุนุงุฑู+ุฉ",
"ุงุชุงููู
",
"ุน+ู",
"ุฌู",
"ุฏู",
"ุงู",
"ู
ุด",
"ุนุงูุฒ+ุฉ",
"ูุชุนุงู
ู",
"ูุฏุฉ",
"EOS"
] | [
"PRON",
"PART",
"PART",
"PROG_PART+V",
"V",
"PART",
"ADJ+NSUFF",
"PART",
"ADJ",
"ADV",
"V",
"PART",
"ADJ+NSUFF",
"V",
"PREP+DET",
"NOUN",
"PRON",
"CONJ",
"PART",
"ADJ+NSUFF",
"V",
"ADV",
"EOS"
] |
5 | "B" | [
"ูุงูุง",
"ูุงุนุฏ",
"ุจุตูู",
"ูู",
"ุงูุญุฑู
",
"ูุงุญุฏ",
"ู
ุตุฑู",
"ุจูุตูู",
"ุฌูุจู",
"ุจุนุฏ",
"ู
ุง",
"ุฎูุตูุง",
"ุจููููู",
"ุญุฑู
ุง",
"ูููุชูู",
"ุฃูุชุฑ",
"ู
ู",
"ูุฏู",
"!",
":D",
"EOS"
] | [
"ู+ุงูุง",
"ูุงุนุฏ",
"ุจ+ุตูู",
"ูู",
"ุงู+ุญุฑู
",
"ูุงุญุฏ",
"ู
ุตุฑู",
"ุจ+ูุตูู",
"ุฌูุจ+ู",
"ุจุนุฏ",
"ู
ุง",
"ุฎูุต+ูุง",
"ุจ+ููู+ู+ู",
"ุญุฑู
+ุง",
"ููู+ุช+ู+ู",
"ุฃูุชุฑ",
"ู
ู",
"ูุฏู",
"!",
":D",
"EOS"
] | [
"CONJ+PRON",
"ADJ",
"PROG_PART+V",
"PREP",
"DET+NOUN",
"NOUN",
"ADJ",
"PROG_PART+V",
"NOUN+PRON",
"NOUN",
"PART",
"V+PRON",
"PROG_PART+V+PREP+PRON",
"NOUN+CASE",
"V+PRON+PREP+PRON",
"ADJ",
"PREP",
"ADV",
"PUNC",
"EMOT",
"EOS"
] |
5 | "B" | [
"ูุจูู",
"ู
ุชูู
ูุด",
"ูุฎููู",
"ูุงุนุฏู",
"ูุงุณูุฑู",
"ุจุฑุฏูู",
"ูุญุฏ",
"ู
ุชูุตูู",
"ุฎุงูุต",
"ุจุนุฏ",
"ูุฏู",
"ูุงู
ู",
"ุจููู",
"@sarrahsherrif",
"EOS"
] | [
"ูุจูู",
"ู
+ุชูู
+ู+ุด",
"ู+ุฎู+ู+ู",
"ูุงุนุฏ+ู",
"ู+ุงุณูุฑ+ู",
"ุจุฑุฏูู",
"ู+ุญุฏ",
"ู
+ุชูุตู+ู",
"ุฎุงูุต",
"ุจุนุฏ",
"ูุฏู",
"ูุงู
+ู",
"ุจ+ู+ูู",
"@sarrahsherrif",
"EOS"
] | [
"V",
"PART+V+PRON+NEG_PART",
"CONJ+V+PRON+PRON",
"ADJ+NSUFF",
"CONJ+V+NSUFF",
"ADV",
"PREP+NOUN",
"PART+V+PRON",
"ADV",
"NOUN",
"ADV",
"V+PRON",
"PREP+DET+NOUN",
"MENTION",
"EOS"
] |
3 | "B" | [
"ุฃุญูู",
"ุฃููุฉ",
"ูู",
"ุงููู",
"ุจุชุงูููุง",
"ู",
"ุฃูุช",
"ู
ูุช",
"ู
ู",
"ุงูุฌูุน",
".",
".",
".",
"ุฃุญูู",
"ุดุฑุจ",
"ู",
"ุฃูุช",
"ู
ูุช",
"ู
ู",
"ุงูุนุทุด",
"ู",
"ุฃุญูู",
"ูุฑุญุฉ",
"ุญุชูุฌู",
"ู",
"ุฃูุช",
"ู
ูุช",
"ู
ู",
"ุงููุฃุณ",
"!",
"!",
"ูุฅุทู
ู",
"EOS"
] | [
"ุฃุญูู",
"ุฃูู+ุฉ",
"ูู",
"ุงููู",
"ุจ+ุชุงูู+ูุง",
"ู",
"ุฃูุช",
"ู
ูุช",
"ู
ู",
"ุงู+ุฌูุน",
".",
".",
".",
"ุฃุญูู",
"ุดุฑุจ",
"ู",
"ุฃูุช",
"ู
ูุช",
"ู
ู",
"ุงู+ุนุทุด",
"ู",
"ุฃุญูู",
"ูุฑุญ+ุฉ",
"ุญ+ุชูุฌู",
"ู",
"ุฃูุช",
"ู
ูุช",
"ู
ู",
"ุงู+ูุฃุณ",
"!",
"!",
"ู+ุฅุทู
ู",
"EOS"
] | [
"ADJ",
"NOUN+NSUFF",
"PRON",
"PART",
"PROG_PART+V+PRON",
"CONJ",
"PRON",
"ADJ",
"PREP",
"DET+NOUN",
"PUNC",
"PUNC",
"PUNC",
"NOUN",
"NOUN",
"CONJ",
"PRON",
"ADJ",
"PREP",
"DET+NOUN",
"CONJ",
"ADJ",
"NOUN+NSUFF",
"FUT_PART+V",
"CONJ",
"PRON",
"ADJ",
"PREP",
"DET+NOUN",
"PUNC",
"PUNC",
"CONJ+V",
"EOS"
] |
1 | "B" | [
"ูู",
"ูุงุณ",
"ูุฏุง",
"ูุงูุฑุฉ",
"ุงููู
",
"ุงููู",
"ู
ู",
"ุญููู
",
"ุจุณ",
"ูุฒุนููุง",
"ูุงู",
"ูู",
"ุงููุงุณ",
"ุฃุชุฎูููุง",
"ุนูุดุงู",
"ูุตูุญููู
",
"-_-",
"!",
"!",
"EOS"
] | [
"ูู",
"ูุงุณ",
"ูุฏุง",
"ูุงูุฑ+ุฉ",
"ุงู+ูู
",
"ุงููู",
"ู
ู",
"ุญู+ูู
",
"ุจุณ",
"ูุฒุนู+ูุง",
"ู+ุงู",
"ูู",
"ุงู+ูุงุณ",
"ุฃุชุฎูู+ูุง",
"ุนูุดุงู",
"ูุตูุญ+ู+ูู
",
"-_-",
"!",
"!",
"EOS"
] | [
"PREP",
"NOUN",
"ADV",
"ADJ+NSUFF",
"PART+PRON",
"PART",
"PREP",
"NOUN+PRON",
"ADV",
"V+PRON",
"CONJ+PART",
"NOUN",
"DET+NOUN",
"V+PRON",
"PART",
"V+PRON+PRON",
"EMOT",
"PUNC",
"PUNC",
"EOS"
] |
4 | "B" | [
"ุงููู",
"ู
ุจุณูุทูู",
"ูู",
"ุญูุงุชููู
",
"ู",
"ุฑุงุถููู",
"ุนูู",
"ูุฑุงุฑุชูู
",
"ุจููุง",
"ูููููู",
"ูู",
"ุงูุฒู
ู",
"ุฏู",
"EOS"
] | [
"ุงููู",
"ู
ุจุณูุท+ูู",
"ูู",
"ุญูุง+ุชู+ูู
",
"ู",
"ุฑุงุถู+ูู",
"ุนูู",
"ูุฑุงุฑ+ุช+ูู
",
"ุจู+ูุง",
"ูููู+ูู",
"ูู",
"ุงู+ุฒู
ู",
"ุฏู",
"EOS"
] | [
"PART",
"ADJ+NSUFF",
"PREP",
"NOUN+NSUFF+PRON",
"CONJ",
"ADJ+NSUFF",
"PREP",
"NOUN+NSUFF+PRON",
"V+PRON",
"ADJ+NSUFF",
"PREP",
"DET+NOUN",
"PRON",
"EOS"
] |
4 | "B" | [
"ุงูุบูุท",
"ู
ููุง",
"ูู
ุง",
"ูููู
",
"ุญุฏ",
"ู",
"ููุชู
",
"ุจูู",
"ุฌุงู
ุฏ",
".",
"ู",
"ุณุงุนุงุช",
"ุจูุญุจู",
"ุ",
"ุจุณ",
"ุจุชุจูู",
"ุนุงูุฒ",
"ุชูููู",
"ุงูุง",
"ุงุณู",
"ุงูู",
"ุญุจูุชู",
".",
"EOS"
] | [
"ุงู+ุบูุท",
"ู
ู+ูุง",
"ูู
ุง",
"ูููู
",
"ุญุฏ",
"ู",
"ููุชู
",
"ุจู+ู",
"ุฌุงู
ุฏ",
".",
"ู",
"ุณุงุน+ุงุช",
"ุจ+ูุญุจ+ู",
"ุ",
"ุจุณ",
"ุจ+ุชุจูู",
"ุนุงูุฒ",
"ุชูู+ู+ู",
"ุงูุง",
"ุงุณู",
"ุงู+ู",
"ุญุจ+ูุช+ู",
".",
"EOS"
] | [
"DET+NOUN",
"PREP+PRON",
"PART",
"V",
"NOUN",
"CONJ",
"V",
"PREP+PRON",
"ADJ",
"PUNC",
"CONJ",
"NOUN+NSUFF",
"PROG_PART+V+PRON",
"PUNC",
"PART",
"PROG_PART+V",
"ADJ",
"V+PREP+PRON",
"PRON",
"ADJ",
"PART+PRON",
"V+PRON+PRON",
"PUNC",
"EOS"
] |
4 | "B" | [
"ุงูุงุญุชุฑุงู
",
"ู
ุด",
"ู
ููุงุณ",
"ููุญุจ",
".",
".",
"ู
ู
ูู",
"ุงููู",
"ุจุญุชุฑู
ู",
"ุจุณ",
"ุจูุฑูู",
"ุนุงุฏู",
"EOS"
] | [
"ุงู+ุงุญุชุฑุงู
",
"ู
ุด",
"ู
ููุงุณ",
"ู+ุงู+ุญุจ",
".",
".",
"ู
ู
ูู",
"ุงููู",
"ุจ+ุญุชุฑู
+ู",
"ุจุณ",
"ุจ+ูุฑู+ู",
"ุนุงุฏู",
"EOS"
] | [
"DET+NOUN",
"PART",
"NOUN",
"PREP+DET+NOUN",
"PUNC",
"PUNC",
"ADJ",
"V",
"PROG_PART+V+PRON",
"PART",
"PROG_PART+V+PRON",
"ADJ",
"EOS"
] |
5 | "B" | [
"ู
ุงูู",
"ู
ููุด",
"#ู
ุณุฎุฑู",
"ุงูุชุฑ",
"ู
ู",
"ุงูู",
"ุชูุงูู",
"#ุจูุช",
"ุจุชุตูู",
"#ุงุณุชุฎุงุฑู",
"ุนุดุงู",
"ู
ุญุชุงุฑู",
"ุชุตุงุญุจ",
"#ุงุฏูู
",
"ููุง",
"#ุนู
ุฑ",
"!",
"EOS"
] | [
"ู
ุง+ูู",
"ู
+ูู+ุด",
"#ู
ุณุฎุฑู",
"ุงูุชุฑ",
"ู
ู",
"ุงู+ู",
"ุชูุงูู",
"#ุจูุช",
"ุจ+ุชุตูู",
"#ุงุณุชุฎุงุฑู",
"ุนุดุงู",
"ู
ุญุชุงุฑ+ู",
"ุชุตุงุญุจ",
"#ุงุฏูู
",
"ู+ูุง",
"#ุนู
ุฑ",
"!",
"EOS"
] | [
"PART+PRON",
"PART+PREP+NEG_PART",
"HASH",
"ADJ",
"PREP",
"PART+PRON",
"V",
"HASH",
"PROG_PART+V",
"HASH",
"PART",
"ADJ+NSUFF",
"V",
"HASH",
"CONJ+PART",
"HASH",
"PUNC",
"EOS"
] |
4 | "B" | [
"@Osamawad_4",
"ู
ุด",
"ุนุงุฑูุฉ",
"ู
ู
ูู",
".",
"ุงูุง",
"ู
ุง",
"ู
ุฑุชุด",
"ุจุงูู
ูุถูุน",
"ุฏู",
".",
"ู
ูููู",
"ู
ุญุฏุฏ",
"ู",
"ุซุงุจุช",
"ู",
"ุงูุญู
ุฏ",
"ููู",
"ุทูุนุช",
"ุตุญ",
"!",
"!",
"ุญุจ",
"ุงููุทู",
"ู
ููููุด",
"ูุบูุท",
"ู",
"ูุตูุญ",
".",
"EOS"
] | [
"@Osamawad_4",
"ู
ุด",
"ุนุงุฑู+ุฉ",
"ู
ู
ูู",
".",
"ุงูุง",
"ู
ุง",
"ู
ุฑ+ุช+ุด",
"ุจ+ุงู+ู
ูุถูุน",
"ุฏู",
".",
"ู
ููู+ู",
"ู
ุญุฏุฏ",
"ู",
"ุซุงุจุช",
"ู",
"ุงู+ุญู
ุฏ",
"ู+ุงููู",
"ุทูุน+ุช",
"ุตุญ",
"!",
"!",
"ุญุจ",
"ุงู+ูุทู",
"ู
+ูู+ูู+ุด",
"ูุบูุท",
"ู",
"ูุตูุญ",
".",
"EOS"
] | [
"MENTION",
"PART",
"ADJ+NSUFF",
"ADJ",
"PUNC",
"PRON",
"PART",
"V+PRON+NEG_PART",
"PREP+DET+NOUN",
"PRON",
"PUNC",
"NOUN+PRON",
"ADJ",
"CONJ",
"ADJ",
"CONJ",
"DET+NOUN",
"PREP+NOUN",
"V+PRON",
"NOUN",
"PUNC",
"PUNC",
"NOUN",
"DET+NOUN",
"PART+PREP+PRON+NEG_PART",
"V",
"CONJ",
"V",
"PUNC",
"EOS"
] |
1 | "B" | [
"ุงูุง",
"ูู
ุง",
"ุฃู
ูุช",
"ู
ุด",
"ูู
ูุช",
"ู
ู",
"ุงูู
ุฑุถ",
"ุจุชุงุนู",
"ุฃูุง",
"ูู
ุง",
"ุฃู
ูุช",
"ูู
ูุช",
"ู
ู",
"ุงูู
ุฑุถ",
"ุงููู",
"ุนูุฏููุง",
"ุฃูุชูุง",
"EOS"
] | [
"ุงูุง",
"ูู
ุง",
"ุฃู
ูุช",
"ู
ุด",
"ู+ู
ูุช",
"ู
ู",
"ุงู+ู
ุฑุถ",
"ุจุชุงุน+ู",
"ุฃูุง",
"ูู
ุง",
"ุฃู
ูุช",
"ู+ู
ูุช",
"ู
ู",
"ุงู+ู
ุฑุถ",
"ุงููู",
"ุนูุฏ+ููุง",
"ุฃูุชูุง",
"EOS"
] | [
"PRON",
"PART",
"V",
"PART",
"FUT_PART+V",
"PREP",
"DET+NOUN",
"NOUN+PRON",
"PRON",
"PART",
"V",
"FUT_PART+V",
"PREP",
"DET+NOUN",
"PART",
"NOUN+PRON",
"PRON",
"EOS"
] |
2 | "B" | [
"@lovly_y@Nour51728751",
"ุงููู",
"ูุงูุนูู",
"ุงูู",
"ูู
ุงู",
"ูุงุจุณ",
"ุงูุณุงุนุฉ",
"(",
"ุงููู",
"ูู",
"ู
ุด",
"ุงูู
ูุฌุง",
")",
"ูู",
"ุงูุฏู",
"ุงููู
ูู",
"-",
"ูุงุนููู",
"ุนูู",
"ุงููุฑุน",
"EOS"
] | [
"@lovly_y@Nour51728751",
"ุงููู",
"ูุงูุน+ูู",
"ุงู+ู",
"ูู
ุงู",
"ูุงุจุณ",
"ุงู+ุณุงุน+ุฉ",
"(",
"ุงููู",
"ูู",
"ู
ุด",
"ุงูู
ูุฌุง",
")",
"ูู",
"ุงูุฏ+ู",
"ุงู+ูู
ูู",
"-",
"ูุง+ุนูู+ู",
"ุนูู",
"ุงู+ูุฑุน",
"EOS"
] | [
"MENTION",
"PART",
"ADJ+PRON",
"PART+PRON",
"ADV",
"ADJ",
"DET+NOUN+NSUFF",
"PUNC",
"PART",
"PRON",
"PART",
"NOUN",
"PUNC",
"PREP",
"NOUN+PRON",
"DET+NOUN",
"PUNC",
"PART+NOUN+PRON",
"PREP",
"DET+NOUN",
"EOS"
] |
5 | "B" | [
"ุนุงุฑูุฉ",
"ุงุญุณุงุณ",
"ุงูู",
"ุจูุชูุฑ",
"ููุงู
ู",
"ุงููุญุด",
"ุงุจูู",
"ู
ุด",
"ุทุงูู",
"ุงุดููู",
"ู",
"ุงูุชูุฑ",
"ุถุญูุชู",
"ุงูุญููุฉ",
"ูุง",
"ุชูุญุดููู",
"!",
"EOS"
] | [
"ุนุงุฑู+ุฉ",
"ุงุญุณุงุณ",
"ุงู+ู",
"ุจ+ูุชูุฑ",
"ููุงู
+ู",
"ุงู+ูุญุด",
"ุงุจูู",
"ู
ุด",
"ุทุงูู",
"ุงุดูู+ู",
"ู",
"ุงูุชูุฑ",
"ุถุญู+ุช+ู",
"ุงู+ุญูู+ุฉ",
"ูุง",
"ุชูุญุด+ู+ูู",
"!",
"EOS"
] | [
"ADJ+NSUFF",
"NOUN",
"PART+PRON",
"PROG_PART+V",
"NOUN+PRON",
"DET+ADJ",
"V",
"PART",
"ADJ",
"V+PRON",
"CONJ",
"V",
"NOUN+NSUFF+PRON",
"DET+ADJ+NSUFF",
"CONJ",
"V+PRON+PRON",
"PUNC",
"EOS"
] |
4 | "B" | [
"ูู",
"ู
ููุชุด",
"ูุชุฎูู",
"ุนูู",
"ุชุนุฑู",
"ุชุฑุจูู",
"ุตุญ",
"ูุจูู",
"ุจูุงุด",
"ุชูุฑู",
"ุงูู
ุฌุชู
ุน",
"ุจุนูุงู",
"ุฒูุงุฏู",
"ุนุฏุฏ",
"ูุฎูุงุต",
".",
".",
".",
"EOS"
] | [
"ูู",
"ู
+ูู+ุช+ุด",
"ู+ุชุฎูู",
"ุนูู",
"ุชุนุฑู",
"ุชุฑุจู+ู",
"ุตุญ",
"ูุจูู",
"ุจูุงุด",
"ุชูุฑู",
"ุงู+ู
ุฌุชู
ุน",
"ุจ+ุนูุงู",
"ุฒูุงุฏ+ู",
"ุนุฏุฏ",
"ู+ุฎูุงุต",
".",
".",
".",
"EOS"
] | [
"PART",
"PART+V+PRON+NEG_PART",
"FUT_PART+V",
"NOUN",
"V",
"V+PRON",
"NOUN",
"V",
"PART",
"V",
"DET+NOUN",
"PREP+NOUN",
"NOUN+NSUFF",
"NOUN",
"CONJ+NOUN",
"PUNC",
"PUNC",
"PUNC",
"EOS"
] |
2 | "B" | [
"ุงูุนูุงุฏุงุช",
"ุงูููุงุฑุฏุฉ",
"ูุงูุช",
"ุฌุงู
ุฏุฉ",
"ุฌุฏุง",
"ูุงูุงุถุฑุงุจ",
"ูุงู",
"ูุงูู",
"ุงูุญูููุฉ",
"ูู",
"ู
ุณุชุดูู",
"ุฑุงุณ",
"ุงูุชูู",
"ุงูุนุงู
",
"EOS"
] | [
"ุงู+ุนูุงุฏ+ุงุช",
"ุงู+ููุงุฑุฏ+ุฉ",
"ูุงู+ุช",
"ุฌุงู
ุฏ+ุฉ",
"ุฌุฏ+ุง",
"ู+ุงู+ุงุถุฑุงุจ",
"ูุงู",
"ูุงูู",
"ุงู+ุญููู+ุฉ",
"ูู",
"ู
ุณุชุดูู",
"ุฑุงุณ",
"ุงู+ุชูู",
"ุงู+ุนุงู
",
"EOS"
] | [
"DET+NOUN+NSUFF",
"DET+NOUN+NSUFF",
"V+PRON",
"ADJ+NSUFF",
"NOUN+CASE",
"CONJ+DET+NOUN",
"V",
"ADJ",
"DET+NOUN+NSUFF",
"PREP",
"NOUN",
"NOUN",
"DET+NOUN",
"DET+ADJ",
"EOS"
] |
3 | "B" | [
"ุนูุฏู",
"ุญุฏ",
"ุจููุชู
",
"ุจูู",
"ู",
"ุจูุฎุงู",
"ุนููู",
"ุทุจ",
"ุฎูู",
"ุจุงูู",
"ู
ูู",
"ุจูุง",
"ุนุดุงู",
"ุฏู",
"ู
ููุด",
"ู
ูู",
"ูุชูุฑ",
"ุฃู",
"ู
ููุด",
"ู
ูู",
"ุฃุตูู",
"#ุญููููุฉ",
"EOS"
] | [
"ุนูุฏ+ู",
"ุญุฏ",
"ุจ+ููุชู
",
"ุจู+ู",
"ู",
"ุจ+ูุฎุงู",
"ุนูู+ู",
"ุทุจ",
"ุฎู+ู",
"ุจุงู+ู",
"ู
ู+ู",
"ุจูุง",
"ุนุดุงู",
"ุฏู",
"ู
+ูู+ุด",
"ู
ู+ู",
"ูุชูุฑ",
"ุฃู",
"ู
+ูู+ุด",
"ู
ู+ู",
"ุฃุตู+ู",
"#ุญููููุฉ",
"EOS"
] | [
"NOUN+PRON",
"NOUN",
"PROG_PART+V",
"PREP+PRON",
"CONJ",
"PROG_PART+V",
"PREP+PRON",
"ADJ",
"V+PRON",
"NOUN+PRON",
"PREP+PRON",
"ADV",
"PART",
"PRON",
"PART+PREP+NEG_PART",
"PREP+PRON",
"ADJ",
"CONJ",
"PART+PREP+NEG_PART",
"PREP+PRON",
"NOUN+CASE",
"HASH",
"EOS"
] |
2 | "B" | [
"ุชุญูุฉ",
"ููู",
"ูุงุญุฏ",
"ูุจุฑ",
"ุงูููุงุฑุฏุฉ",
"ูู
ุงูุฒูุด",
"ุ",
"ุชูุฒู",
"ุงูู",
"ููู
",
"!",
"!",
"ุฏุฉ",
"ุญุชู",
"ูุญุดุฉ",
"ูู
ุง",
"ุชุชูุชุจ",
"ูู",
"ุงู",
"CV",
".",
"EOS"
] | [
"ุชุญู+ุฉ",
"ู+ูู",
"ูุงุญุฏ",
"ูุจุฑ",
"ุงู+ููุงุฑุฏ+ุฉ",
"ู+ู
ุง+ูุฒู+ุด",
"ุ",
"ุชูุฒู",
"ุงูู",
"ููู
",
"!",
"!",
"ุฏุฉ",
"ุญุชู",
"ูุญุด+ุฉ",
"ูู
ุง",
"ุชุชูุชุจ",
"ูู",
"ุงู",
"CV",
".",
"EOS"
] | [
"NOUN+NSUFF",
"PREP+NOUN",
"NOUN",
"V",
"DET+NOUN+NSUFF",
"CONJ+PART+V+NEG_PART",
"PUNC",
"V",
"NUM",
"NOUN",
"PUNC",
"PUNC",
"PRON",
"PART",
"ADJ+NSUFF",
"PART",
"V",
"PREP",
"DET",
"FOREIGN",
"PUNC",
"EOS"
] |
4 | "B" | [
"ุฅูุช",
"ู
ุนุตูู
",
"ู
ู",
"ุงูุบูุท",
"ุ",
"!",
"ูุงุก",
"ุ",
"!",
"ุทุจ",
"ููู",
"ุจูู",
"ุจุชุญุณุณูู",
"ูู
ุง",
"ุจุบูุท",
"ุฅู",
"ุฏู",
"ููุงูุฉ",
"ุงูุนุงูู
",
"ูุนูู",
"!",
"EOS"
] | [
"ุฅูุช",
"ู
ุนุตูู
",
"ู
ู",
"ุงู+ุบูุท",
"ุ",
"!",
"ูุงุก",
"ุ",
"!",
"ุทุจ",
"ููู",
"ุจูู",
"ุจ+ุชุญุณุณ+ูู",
"ูู
ุง",
"ุจ+ุบูุท",
"ุฅู",
"ุฏู",
"ููุงู+ุฉ",
"ุงู+ุนุงูู
",
"ูุนูู",
"!",
"EOS"
] | [
"PRON",
"ADJ",
"PREP",
"DET+NOUN",
"PUNC",
"PUNC",
"PART",
"PUNC",
"PUNC",
"ADJ",
"PART",
"ADV",
"PROG_PART+V+PRON",
"PART",
"PROG_PART+V",
"PART",
"PRON",
"NOUN+NSUFF",
"DET+NOUN",
"ADV",
"PUNC",
"EOS"
] |
4 | "B" | [
"ุจููุถู",
"ูููู",
"ูููุงุณ",
"ู
ุงููุด",
"ุญุงุฌุฉ",
"ุชุณุชุงูู",
"ูุงูู
ูุฑูุถ",
"ูููู",
"ูููุณูุง",
"ุงูุฃูู",
".",
"EOS"
] | [
"ุจ+ููุถู",
"ูููู",
"ู+ุงู+ูุงุณ",
"ู
ุง+ูู+ุด",
"ุญุงุฌ+ุฉ",
"ุชุณุชุงูู",
"ู+ุงู+ู
ูุฑูุถ",
"ูููู",
"ู+ููุณ+ูุง",
"ุงู+ุฃูู",
".",
"EOS"
] | [
"PROG_PART+V",
"V",
"PREP+DET+NOUN",
"PART+PREP+NEG_PART",
"NOUN+NSUFF",
"V",
"CONJ+DET+ADJ",
"V",
"PREP+NOUN+PRON",
"DET+NUM",
"PUNC",
"EOS"
] |
2 | "B" | [
"ุฃูู",
"ุงูุฏูุชูุฑ",
"ุจุชุงุน",
"ุงูุฅุณูุงู",
"ุจูููู",
"ุฃู",
"ุงูุบูุฑ",
"ู
ุชุฒูุฌูู",
"ุจูุนู
ููุง",
"ุฃุฒู
ุฉ",
"ุณูุงููุฉ",
"ุ",
"ูุฃูุง",
"ููู",
"ุฌูุจ",
"ู
ุตุฑ",
"ููุณุงุนุฏ",
"ูู",
"ุญู",
"ุงูู
ุดููุฉ",
"ุ",
"ุฌูุฒููุง",
"ุจูู",
"EOS"
] | [
"ุฃูู",
"ุงู+ุฏูุชูุฑ",
"ุจุชุงุน",
"ุงู+ุฅุณูุงู",
"ุจ+ูููู",
"ุฃู",
"ุงู+ุบูุฑ",
"ู
ุชุฒูุฌ+ูู",
"ุจ+ูุนู
ู+ูุง",
"ุฃุฒู
+ุฉ",
"ุณูุงูู+ุฉ",
"ุ",
"ู+ุฃูุง",
"ู+ูู",
"ุฌูุจ",
"ู
ุตุฑ",
"ู+ู+ุณุงุนุฏ",
"ูู",
"ุญู",
"ุงู+ู
ุดูู+ุฉ",
"ุ",
"ุฌูุฒ+ู+ูุง",
"ุจูู",
"EOS"
] | [
"PART",
"DET+NOUN",
"NOUN",
"DET+NOUN",
"PROG_PART+V",
"PART",
"DET+NOUN",
"ADJ+NSUFF",
"PROG_PART+V+PRON",
"NOUN+NSUFF",
"ADJ+NSUFF",
"PUNC",
"CONJ+PRON",
"FUT_PART+V",
"NOUN",
"NOUN",
"CONJ+FUT_PART+V",
"PREP",
"NOUN",
"DET+NOUN+NSUFF",
"PUNC",
"V+PRON+PRON",
"ADV",
"EOS"
] |
5 | "B" | [
"ุงูู
ุฑุงู",
"ู
ุด",
"ุนุงูุฒู",
"ุงุญุชูุงูุงุช",
"ุงูู
ุฑุฃู",
"ุนุงูุฒู",
"ู
ูู",
"ุงุญุชุฑุงู
",
"ููู",
"ู
ุงุดูู",
"ูุดุงุฑุน",
"ู
ุชุนูุณูุงุด",
"ูู",
"ุฑุงูุจู",
"ู
ูุงุตูุงุช",
"ููู
",
"ุงูุช",
"ููู",
"ุชุนุฏ",
"ุนุงูุฒู",
"ุงุญุชุฑุงู
",
"ูุจุณ",
"EOS"
] | [
"ุงู+ู
ุฑุง+ู",
"ู
ุด",
"ุนุงูุฒ+ู",
"ุงุญุชูุงู+ุงุช",
"ุงู+ู
ุฑุฃ+ู",
"ุนุงูุฒ+ู",
"ู
ู+ู",
"ุงุญุชุฑุงู
",
"ู+ูู",
"ู
ุงุดู+ู",
"ู+ุดุงุฑุน",
"ู
+ุชุนูุณ+ูุง+ุด",
"ูู",
"ุฑุงูุจ+ู",
"ู
ูุงุตู+ุงุช",
"ููู
",
"ุงูุช",
"ู+ูู",
"ุชุนุฏ",
"ุนุงูุฒ+ู",
"ุงุญุชุฑุงู
",
"ู+ุจุณ",
"EOS"
] | [
"DET+NOUN+NSUFF",
"PART",
"ADJ+NSUFF",
"NOUN+NSUFF",
"DET+NOUN+NSUFF",
"ADJ+NSUFF",
"PREP+PRON",
"NOUN",
"CONJ+PRON",
"ADJ+NSUFF",
"PREP+NOUN",
"PART+V+PRON+NEG_PART",
"PART",
"ADJ+NSUFF",
"NOUN+NSUFF",
"V",
"PRON",
"CONJ+PRON",
"V",
"ADJ+NSUFF",
"NOUN",
"CONJ+ADV",
"EOS"
] |
1 | "B" | [
"ู
ุญุฏุด",
"ุจูุฎุชุงุฑ",
"ุขููุฉ",
"ุฃู",
"ุญูุงุชุฉ",
"ุจุณ",
"ุจุชูุฏุฑ",
"ุชุฎุชุงุฑ",
"ูุชุญุฏุฏ",
"ุตุญุงุจู",
"ุ",
"ู
ุณุชูุจูู",
"ุ",
"ุญูู
ู",
"ู
ุชุฎููุด",
"ุญุฏ",
"ูุญุณุณู",
"ุงูู",
"ุฃูู",
"ู
ูุฉ",
"ู
ูู
ุง",
"ูุงู",
"ุงูุณุจุจ",
"EOS"
] | [
"ู
+ุญุฏ+ุด",
"ุจ+ูุฎุชุงุฑ",
"ุขูู+ุฉ",
"ุฃู",
"ุญูุง+ุช+ุฉ",
"ุจุณ",
"ุจ+ุชูุฏุฑ",
"ุชุฎุชุงุฑ",
"ู+ุชุญุฏุฏ",
"ุตุญุงุจ+ู",
"ุ",
"ู
ุณุชูุจู+ู",
"ุ",
"ุญูู
+ู",
"ู
+ุชุฎู+ู+ุด",
"ุญุฏ",
"ูุญุณุณ+ู",
"ุงู+ู",
"ุฃูู",
"ู
ู+ุฉ",
"ู
ูู
ุง",
"ูุงู",
"ุงู+ุณุจุจ",
"EOS"
] | [
"PART+NOUN+NEG_PART",
"PROG_PART+V",
"NOUN+PRON",
"CONJ",
"NOUN+NSUFF+PRON",
"PART",
"PROG_PART+V",
"V",
"CONJ+V",
"NOUN+PRON",
"PUNC",
"NOUN+PRON",
"PUNC",
"NOUN+PRON",
"PART+V+PRON+NEG_PART",
"NOUN",
"V+PRON",
"PART+PRON",
"ADJ",
"PREP+PRON",
"PART",
"V",
"DET+NOUN",
"EOS"
] |
4 | "B" | [
"ู
ู
ูู",
"ูููู",
"ุงูุนูุจ",
"ูููุง",
"ุงู",
"ู
ุด",
"ุนุงุฌุจูุง",
"ุญุงููุง",
"ูุงุฒู
",
"ุชุจุฏุฃ",
"ุชุญุจ",
"ููุณู",
"ู",
"ุชุดูููุง",
"ุญููุฉ",
"ุนุดุงู",
"ุงููุงุณ",
"ูู
ุงู",
"ุชุดููู",
"ูุฏุฉ",
"ูุฃู",
"ุจุจุณุงุทุฉ",
"ู
ุญุฏุด",
"ููุญุจู",
"ูุงูุช",
"ู
ุจุชุญุจุด",
"ููุณู",
"(",
"2",
")",
"EOS"
] | [
"ู
ู
ูู",
"ูููู",
"ุงู+ุนูุจ",
"ูู+ูุง",
"ุงู",
"ู
ุด",
"ุนุงุฌุจ+ูุง",
"ุญุงู+ูุง",
"ูุงุฒู
",
"ุชุจุฏุฃ",
"ุชุญุจ",
"ููุณ+ู",
"ู",
"ุชุดูู+ูุง",
"ุญูู+ุฉ",
"ุนุดุงู",
"ุงู+ูุงุณ",
"ูู
ุงู",
"ุชุดูู+ู",
"ูุฏุฉ",
"ู+ุฃู",
"ุจ+ุจุณุงุท+ุฉ",
"ู
+ุญุฏ+ุด",
"ู+ูุญุจ+ู",
"ู+ุงูุช",
"ู
+ุจ+ุชุญุจ+ุด",
"ููุณ+ู",
"(",
"2",
")",
"EOS"
] | [
"ADJ",
"V",
"DET+NOUN",
"PREP+PRON",
"PART",
"PART",
"ADJ+PRON",
"NOUN+PRON",
"ADJ",
"V",
"V",
"NOUN+PRON",
"CONJ",
"V+PRON",
"ADJ+NSUFF",
"PART",
"DET+NOUN",
"ADV",
"V+PRON",
"ADV",
"PREP+PART",
"PREP+NOUN+NSUFF",
"PART+NOUN+NEG_PART",
"FUT_PART+V+PRON",
"CONJ+PRON",
"PART+PROG_PART+V+NEG_PART",
"NOUN+PRON",
"PUNC",
"NUM",
"PUNC",
"EOS"
] |
3 | "B" | [
"ุงูุชูุง",
"ู
ุด",
"ู
ุชุฎูููู",
"ุงูุง",
"ุจูุฑู",
"ุงููููู",
"ุงุฒุงู",
".",
".",
".",
"ุงูุง",
"ุจู
ุดู",
"ุงุณุชุฎุจู",
"ู
ู",
"ุงููุงุณ",
"ุงููู",
"ู
ุจุญุจูุงุด",
"ู",
"ุฏูู",
"ูุชูุฑ",
"EOS"
] | [
"ุงูุชูุง",
"ู
ุด",
"ู
ุชุฎูู+ูู",
"ุงูุง",
"ุจูุฑ+ู",
"ุงู+ููู+ู",
"ุงุฒุงู",
".",
".",
".",
"ุงูุง",
"ุจ+ู
ุดู",
"ุงุณุชุฎุจู",
"ู
ู",
"ุงู+ูุงุณ",
"ุงููู",
"ู
+ุจ+ุญุจ+ูุง+ุด",
"ู",
"ุฏูู",
"ูุชูุฑ",
"EOS"
] | [
"PRON",
"PART",
"ADJ+NSUFF",
"PRON",
"NOUN+NSUFF",
"DET+NOUN+NSUFF",
"PART",
"PUNC",
"PUNC",
"PUNC",
"PRON",
"PROG_PART+V",
"V",
"PREP",
"DET+NOUN",
"PART",
"PART+PROG_PART+V+PRON+NEG_PART",
"CONJ",
"PRON",
"ADJ",
"EOS"
] |
5 | "B" | [
"ูู
ุง",
"ุงุฌู",
"ุงุบุณู",
"ุณูุงูู",
"ูุงุดู
",
"ุฑูุญุฉ",
"ู
ุฌุงุฑู",
"ู",
"ุงู
",
"ุงูู
ูุงุฉ",
"ุชุจูู",
"ุนูุดุฉ",
"ุชูุฑู",
"ุญุชู",
"ุงูู
ูุงุฉ",
"ู
ุด",
"ุนุงุฑููู",
"ูุดุฑุจูุง",
"ุงูููููููููููููููููููููููููููููููููููููุฉ",
"ุงูุฐู",
"ุฏุฉ",
"EOS"
] | [
"ูู
ุง",
"ุงุฌู",
"ุงุบุณู",
"ุณูุงู+ู",
"ู+ุงุดู
",
"ุฑูุญ+ุฉ",
"ู
ุฌุงุฑู",
"ู",
"ุงู
",
"ุงู+ู
ูุงุฉ",
"ุชุจูู",
"ุนูุด+ุฉ",
"ุชูุฑู",
"ุญุชู",
"ุงู+ู
ูุงุฉ",
"ู
ุด",
"ุนุงุฑู+ูู",
"ูุดุฑุจ+ูุง",
"ุงูููููููููููููููููููููููููููููููููููููุฉ",
"ุงู+ุฐู",
"ุฏุฉ",
"EOS"
] | [
"PART",
"V",
"V",
"NOUN+PRON",
"CONJ+V",
"NOUN+NSUFF",
"NOUN",
"PREP",
"NOUN",
"DET+NOUN",
"V",
"NOUN+NSUFF",
"V",
"PART",
"DET+NOUN",
"PART",
"ADJ+NSUFF",
"V+PRON",
"PART",
"DET+NOUN",
"PRON",
"EOS"
] |
3 | "B" | [
"ุจุจูู",
"ู
ุญุฑุฌ",
"ู
ู",
"ุงููุงุณ",
"ุงููู",
"ุนู
ุฑู",
"ู
ุงุดููุช",
"ู
ููู
",
"ุญุงุฌุฉ",
"ูุญุดุฉ",
"ุจุณ",
"ููู",
"ุญุงุฌุฒ",
"ููุณู",
"ูุงุญูุชูู
",
"ูู
ุฌุฑุฏ",
"ุงููู
",
"ุจูููุฑููู",
"ุจุฃูุงู
",
"ุฒุจุงูุฉ",
".",
"EOS"
] | [
"ุจ+ุจูู",
"ู
ุญุฑุฌ",
"ู
ู",
"ุงู+ูุงุณ",
"ุงููู",
"ุนู
ุฑ+ู",
"ู
ุง+ุดูู+ุช",
"ู
ู+ูู
",
"ุญุงุฌ+ุฉ",
"ูุญุด+ุฉ",
"ุจุณ",
"ูู+ู",
"ุญุงุฌุฒ",
"ููุณู",
"ูุงุญู+ุช+ูู
",
"ู+ู
ุฌุฑุฏ",
"ุงู+ูู
",
"ุจ+ูููุฑ+ู+ูู",
"ุจ+ุฃูุงู
",
"ุฒุจุงู+ุฉ",
".",
"EOS"
] | [
"PROG_PART+V",
"ADJ",
"PREP",
"DET+NOUN",
"PART",
"NOUN+PRON",
"PART+V+PRON",
"PREP+PRON",
"NOUN+NSUFF",
"ADJ+NSUFF",
"PART",
"PREP+PRON",
"NOUN",
"ADJ",
"NOUN+NSUFF+PRON",
"PREP+NOUN",
"PART+PRON",
"PROG_PART+V+PRON+PRON",
"PREP+NOUN",
"NOUN+NSUFF",
"PUNC",
"EOS"
] |
1 | "B" | [
"ู
ุนูุฏูุด",
"ุตุญุงุจ",
"ูู",
"ุงูุญูููุฉ",
"ุงุฎุฑุฌ",
"ู
ุนุงูู
",
"ูุงูููุงู
",
"ุฏู",
"ุนุดุงู",
"ูู",
"ุงููู",
"ุงุนุฑููู
",
"ูู",
"ุงูุญูููุฉ",
"ุจููุฑููุง",
"ุจุนุถ",
"ูุจูู
ุซููุง",
"ุงููู
",
"ุจูุญุจูุง",
"ุจุนุถ",
".",
".",
"EOS"
] | [
"ู
+ุนูุฏ+ู+ุด",
"ุตุญุงุจ",
"ูู",
"ุงู+ุญููู+ุฉ",
"ุงุฎุฑุฌ",
"ู
ุนุง+ูู
",
"ู+ุงู+ููุงู
",
"ุฏู",
"ุนุดุงู",
"ูู",
"ุงููู",
"ุงุนุฑู+ูู
",
"ูู",
"ุงู+ุญููู+ุฉ",
"ุจ+ููุฑู+ูุง",
"ุจุนุถ",
"ู+ุจ+ูู
ุซู+ูุง",
"ุงู+ูู
",
"ุจ+ูุญุจ+ูุง",
"ุจุนุถ",
".",
".",
"EOS"
] | [
"PART+NOUN+PRON+NEG_PART",
"NOUN",
"PREP",
"DET+NOUN+NSUFF",
"V",
"NOUN+PRON",
"CONJ+DET+NOUN",
"PRON",
"PART",
"NOUN",
"PART",
"V+PRON",
"PREP",
"DET+NOUN+NSUFF",
"PROG_PART+V+PRON",
"NOUN",
"CONJ+PROG_PART+V+PRON",
"PART+PRON",
"PROG_PART+V+PRON",
"NOUN",
"PUNC",
"PUNC",
"EOS"
] |
4 | "B" | [
"ุงูุจูุช",
"ุงููู",
"ุจุชุณูุช",
"ูุชูุฑ",
"ุจุชุนูุท",
"ูุชูุฑ",
"!",
"ูุฑุจูุง",
"ููููู",
"ุดุฑ",
"ุงูุจูุช",
"ูู
ุง",
"ุชููู",
"ู
ุจุณูุทู",
"ูุชุตุฏุนู",
"ู
ู",
"ูุชุฑ",
"ุงูููุงู
",
"!",
"EOS"
] | [
"ุงู+ุจูุช",
"ุงููู",
"ุจ+ุชุณูุช",
"ูุชูุฑ",
"ุจ+ุชุนูุท",
"ูุชูุฑ",
"!",
"ู+ุฑุจ+ูุง",
"ูููู+ู",
"ุดุฑ",
"ุงู+ุจูุช",
"ูู
ุง",
"ุชููู",
"ู
ุจุณูุท+ู",
"ู+ุชุตุฏุน+ู",
"ู
ู",
"ูุชุฑ",
"ุงู+ููุงู
",
"!",
"EOS"
] | [
"DET+NOUN",
"PART",
"PROG_PART+V",
"ADJ",
"PROG_PART+V",
"ADJ",
"PUNC",
"CONJ+NOUN+PRON",
"V+PRON",
"NOUN",
"DET+NOUN",
"PART",
"V",
"ADJ+NSUFF",
"FUT_PART+V+PRON",
"PREP",
"NOUN",
"DET+NOUN",
"PUNC",
"EOS"
] |
4 | "B" | [
"ุงูู
ุตุฑู",
"ุงููุญูุฏ",
"ุงููู",
"ูู",
"ุญุตูุชูู",
"ู
ุตูุจู",
"ูุนุฑู",
"ุงููุง",
"ู
ุด",
"ุนูุฏู",
"ููุญุฏู",
"ูุฑุชุงุญ",
"ูุนูู",
"ู
ุซูุง",
"ูู",
"ุงูููุฑ",
"ููุทุน",
"ูุฑูุญ",
"ูุจุต",
"ุนูุฏ",
"ุฌุงุฑู",
"ูู",
"ููุงู",
"ูุงุทุน",
"ูุฑุชุงุญ",
"EOS"
] | [
"ุงู+ู
ุตุฑู",
"ุงู+ูุญูุฏ",
"ุงููู",
"ูู",
"ุญุตู+ุช+ู+ู",
"ู
ุตูุจ+ู",
"ู+ุนุฑู",
"ุงู+ูุง",
"ู
ุด",
"ุนูุฏ+ู",
"ู+ูุญุฏ+ู",
"ูุฑุชุงุญ",
"ูุนูู",
"ู
ุซู+ุง",
"ูู",
"ุงู+ููุฑ",
"ูุทุน",
"ูุฑูุญ",
"ูุจุต",
"ุนูุฏ",
"ุฌุงุฑ+ู",
"ูู",
"ูู+ุง+ู",
"ูุงุทุน",
"ูุฑุชุงุญ",
"EOS"
] | [
"DET+NOUN",
"DET+ADJ",
"PART",
"PART",
"V+PRON+PREP+PRON",
"NOUN+NSUFF",
"CONJ+V",
"PART+PRON",
"PART",
"NOUN+PRON",
"PREP+NOUN+PRON",
"V",
"ADV",
"NOUN+CASE",
"PART",
"DET+NOUN",
"V",
"V",
"V",
"NOUN",
"NOUN+PRON",
"PART",
"V+PRON+PRON",
"ADJ",
"V",
"EOS"
] |
Dataset Card for Arabic POS Dialect
Dataset Summary
This dataset was created to support part of speech (POS) tagging in dialects of Arabic. It contains sets of 350 manually segmented and POS tagged tweets for each of four dialects: Egyptian, Levantine, Gulf, and Maghrebi.
Supported Tasks and Leaderboards
The dataset can be used to train a model for Arabic token segmentation and part of speech tagging in Arabic dialects. Success on this task is typically measured by achieving a high accuracy over a held out dataset. Darwish et al. (2018) train a CRF model across all four dialects and achieve an average accuracy of 89.3%.
Languages
The BCP-47 code is ar-Arab. The dataset consists of four dialects of Arabic, Egyptian (EGY), Levantine (LEV), Gulf (GLF), and Maghrebi (MGR), written in Arabic script.
Dataset Structure
Data Instances
Below is a partial example from the Egyptian set:
- `Fold`: 4
- `SubFold`: A
- `Word`: [ليه, لما, تحب, حد, من, قلبك, ...]
- `Segmentation`: [ليه, لما, تحب, حد, من, قلب+ك, ...]
- `POS`: [PART, PART, V, NOUN, PREP, NOUN+PRON, ...]
Data Fields
The `fold` and the `subfold` fields refer to the crossfold validation splits used by Darwish et al., which can be generated using this script.
- `fold`: An int32 indicating which fold the instance was in for the crossfold validation
- `subfold`: A string, either 'A' or 'B', indicating which subfold the instance was in for the crossfold validation
- `words`: A sequence of strings of the unsegmented tokens
- `segments`: A sequence of strings consisting of the segments of the word separated by '+' if there is more than one segment
- `pos_tags`: A sequence of strings of the part of speech tags of the segments separated by '+' if there is more than one segment
The POS tags consist of a set developed by Darwish et al. (2017) for Modern Standard Arabic (MSA) plus an additional 6 tags (2 dialect-specific tags and 4 tweet-specific tags).
Tag | Purpose | Description |
---|---|---|
ADV | MSA | Adverb |
ADJ | MSA | Adjective |
CONJ | MSA | Conjunction |
DET | MSA | Determiner |
NOUN | MSA | Noun |
NSUFF | MSA | Noun suffix |
NUM | MSA | Number |
PART | MSA | Particle |
PREP | MSA | Preposition |
PRON | MSA | Pronoun |
PUNC | MSA | Punctuation |
V | MSA | Verb |
ABBREV | MSA | Abbreviation |
CASE | MSA | Alef of tanween fatha |
JUS | MSA | Jussification attached to verbs |
VSUFF | MSA | Verb Suffix |
FOREIGN | MSA | Non-Arabic as well as non-MSA words |
FUT_PART | MSA | Future particle "s" prefix and "swf" |
PROG_PART | Dialect | Progressive particle |
NEG_PART | Dialect | Negation particle |
HASH | Tweet | Hashtag |
EMOT | Tweet | Emoticon/Emoji |
MENTION | Tweet | Mention |
URL | Tweet | URL |
Data Splits
The dataset is split by dialect.
Dialect | Tweets | Words |
---|---|---|
Egyptian (EGY) | 350 | 7481 |
Levantine (LEV) | 350 | 7221 |
Gulf (GLF) | 350 | 6767 |
Maghrebi (MGR) | 350 | 6400 |
Dataset Creation
Curation Rationale
This dataset was created to address the lack of computational resources available for dialects of Arabic. These dialects are typically used in speech, while written forms of the language are typically in Modern Standard Arabic. Social media, however, has provided a venue for people to use dialects in written format.
Source Data
This dataset builds off of the work of Eldesouki et al. (2017) and Samih et al. (2017b) who originally collected the tweets.
Initial Data Collection and Normalization
They started with 175 million Arabic tweets returned by the Twitter API using the query "lang:ar" in March 2014. They then filtered this set using author-identified locations and tokens that are unique to each dialect. Finally, they had native speakers of each dialect select 350 tweets that were heavily accented.
Who are the source language producers?
The source language producers are people who posted on Twitter in Arabic using dialectal words from countries where the dialects of interest were spoken, as identified in Mubarak and Darwish (2014).
Annotations
Annotation process
The segmentation guidelines are available at https://alt.qcri.org/resources1/da_resources/seg-guidelines.pdf. The tagging guidelines are not provided, but Darwish et al. note that there were multiple rounds of quality control and revision.
Who are the annotators?
The POS tags were annotated by native speakers of each dialect. Further information is not known.
Personal and Sensitive Information
[More Information Needed]
Considerations for Using the Data
Social Impact of Dataset
Darwish et al. find that the accuracy on the Maghrebi dataset suffered the most when the training set was from another dialect, and conversely training on Maghrebi yielded the worst results for all the other dialects. They suggest that Egyptian, Levantine, and Gulf may be more similar to each other and Maghrebi the most dissimilar to all of them. They also find that training on Modern Standard Arabic (MSA) and testing on dialects yielded significantly lower results compared to training on dialects and testing on MSA. This suggests that dialectal variation should be a significant consideration for future work in Arabic NLP applications, particularly when working with social media text.
Discussion of Biases
[More Information Needed]
Other Known Limitations
[More Information Needed]
Additional Information
Dataset Curators
This dataset was curated by Kareem Darwish, Hamdy Mubarak, Mohamed Eldesouki and Ahmed Abdelali with the Qatar Computing Research Institute (QCRI), Younes Samih and Laura Kallmeyer with the University of Dusseldorf, Randah Alharbi and Walid Magdy with the University of Edinburgh, and Mohammed Attia with Google. No funding information was included.
Licensing Information
This dataset is licensed under the Apache License, Version 2.0.
Citation Information
Kareem Darwish, Hamdy Mubarak, Ahmed Abdelali, Mohamed Eldesouki, Younes Samih, Randah Alharbi, Mohammed Attia, Walid Magdy and Laura Kallmeyer (2018) Multi-Dialect Arabic POS Tagging: A CRF Approach. Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC 2018), May 7-12, 2018. Miyazaki, Japan.
@InProceedings{DARWISH18.562,
author = {Kareem Darwish ,Hamdy Mubarak ,Ahmed Abdelali ,Mohamed Eldesouki ,Younes Samih ,Randah Alharbi ,Mohammed Attia ,Walid Magdy and Laura Kallmeyer},
title = {Multi-Dialect Arabic POS Tagging: A CRF Approach},
booktitle = {Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC 2018)},
year = {2018},
month = {may},
date = {7-12},
location = {Miyazaki, Japan},
editor = {Nicoletta Calzolari (Conference chair) and Khalid Choukri and Christopher Cieri and Thierry Declerck and Sara Goggi and Koiti Hasida and Hitoshi Isahara and Bente Maegaard and Joseph Mariani and Hélène Mazo and Asuncion Moreno and Jan Odijk and Stelios Piperidis and Takenobu Tokunaga},
publisher = {European Language Resources Association (ELRA)},
address = {Paris, France},
isbn = {979-10-95546-00-9},
language = {english}
}
Contributions
Thanks to @mcmillanmajora for adding this dataset.
- Downloads last month
- 963