Secure your code as it's written. Use Snyk Code to scan source code in minutes - no build needed - and fix issues immediately.
def test_augment_terminal():
    """Check augment_terminal() against a fixed table of verb terminals.

    Each row holds the three arguments passed to augment_terminal()
    (terminal name, word form, tag string) followed by the exact
    string the call is expected to return.
    """
    cases = (
        ("so_subj_op_þf", "langaði", "OP-GM-FH-ÞT-3P-ET",
         "so_subj_op_þf_et_fh_gm_þt"),
        ("so_subj_sagnb_þf", "langað", "GM-SAGNB",
         "so_subj_sagnb_þf_gm"),
        ("so_subj_lhþt_et_kvk", "valin", "LHÞT-SB-KVK-NFET",
         "so_subj_lhþt_et_kvk_nf_sb"),
        ("so_subj_nh", "skorta", "GM-NH",
         "so_subj_nh_gm"),
        ("so_subj_nh_þgf", "blöskra", "GM-NH",
         "so_subj_nh_þgf_gm"),
        ("so_1_þf_subj_op_þgf", "þraut", "OP-GM-FH-ÞT-1P-ET",
         "so_1_þf_subj_op_þgf_et_fh_gm_þt"),
        ("so_2_þgf_þf_p1_et", "skrifa", "GM-FH-NT-1P-ET",
         "so_2_þgf_þf_et_fh_gm_nt_p1"),
        ("so_0_lhþt_et_kk", "kembdur", "LHÞT-SB-KK-NFET",
         "so_0_et_kk_lhþt_nf_sb"),
    )
    # Rows are checked in order, so the first mismatch stops the test
    for terminal, word, tags, expected in cases:
        augmented = augment_terminal(terminal, word, tags)
        assert augmented == expected
def test_augment_terminal():
    """Check augment_terminal() against a fixed table of verb terminals.

    Each row holds the three arguments passed to augment_terminal()
    (terminal name, word form, tag string) followed by the exact
    string the call is expected to return.
    """
    cases = (
        ("so_subj_op_þf", "langaði", "OP-GM-FH-ÞT-3P-ET",
         "so_subj_op_þf_et_fh_gm_þt"),
        ("so_subj_sagnb_þf", "langað", "GM-SAGNB",
         "so_subj_sagnb_þf_gm"),
        ("so_subj_lhþt_et_kvk", "valin", "LHÞT-SB-KVK-NFET",
         "so_subj_lhþt_et_kvk_nf_sb"),
        ("so_subj_nh", "skorta", "GM-NH",
         "so_subj_nh_gm"),
        ("so_subj_nh_þgf", "blöskra", "GM-NH",
         "so_subj_nh_þgf_gm"),
        ("so_1_þf_subj_op_þgf", "þraut", "OP-GM-FH-ÞT-1P-ET",
         "so_1_þf_subj_op_þgf_et_fh_gm_þt"),
        ("so_2_þgf_þf_p1_et", "skrifa", "GM-FH-NT-1P-ET",
         "so_2_þgf_þf_et_fh_gm_nt_p1"),
        ("so_0_lhþt_et_kk", "kembdur", "LHÞT-SB-KK-NFET",
         "so_0_et_kk_lhþt_nf_sb"),
    )
    # Rows are checked in order, so the first mismatch stops the test
    for terminal, word, tags, expected in cases:
        augmented = augment_terminal(terminal, word, tags)
        assert augmented == expected
def test_augment_terminal():
    """Check augment_terminal() against a fixed table of verb terminals.

    Each row holds the three arguments passed to augment_terminal()
    (terminal name, word form, tag string) followed by the exact
    string the call is expected to return.
    """
    cases = (
        ("so_subj_op_þf", "langaði", "OP-GM-FH-ÞT-3P-ET",
         "so_subj_op_þf_et_fh_gm_þt"),
        ("so_subj_sagnb_þf", "langað", "GM-SAGNB",
         "so_subj_sagnb_þf_gm"),
        ("so_subj_lhþt_et_kvk", "valin", "LHÞT-SB-KVK-NFET",
         "so_subj_lhþt_et_kvk_nf_sb"),
        ("so_subj_nh", "skorta", "GM-NH",
         "so_subj_nh_gm"),
        ("so_subj_nh_þgf", "blöskra", "GM-NH",
         "so_subj_nh_þgf_gm"),
        ("so_1_þf_subj_op_þgf", "þraut", "OP-GM-FH-ÞT-1P-ET",
         "so_1_þf_subj_op_þgf_et_fh_gm_þt"),
        ("so_2_þgf_þf_p1_et", "skrifa", "GM-FH-NT-1P-ET",
         "so_2_þgf_þf_et_fh_gm_nt_p1"),
        ("so_0_lhþt_et_kk", "kembdur", "LHÞT-SB-KK-NFET",
         "so_0_et_kk_lhþt_nf_sb"),
    )
    # Rows are checked in order, so the first mismatch stops the test
    for terminal, word, tags, expected in cases:
        augmented = augment_terminal(terminal, word, tags)
        assert augmented == expected
def test_augment_terminal():
    """Check augment_terminal() against a fixed table of verb terminals.

    Each row holds the three arguments passed to augment_terminal()
    (terminal name, word form, tag string) followed by the exact
    string the call is expected to return.
    """
    cases = (
        ("so_subj_op_þf", "langaði", "OP-GM-FH-ÞT-3P-ET",
         "so_subj_op_þf_et_fh_gm_þt"),
        ("so_subj_sagnb_þf", "langað", "GM-SAGNB",
         "so_subj_sagnb_þf_gm"),
        ("so_subj_lhþt_et_kvk", "valin", "LHÞT-SB-KVK-NFET",
         "so_subj_lhþt_et_kvk_nf_sb"),
        ("so_subj_nh", "skorta", "GM-NH",
         "so_subj_nh_gm"),
        ("so_subj_nh_þgf", "blöskra", "GM-NH",
         "so_subj_nh_þgf_gm"),
        ("so_1_þf_subj_op_þgf", "þraut", "OP-GM-FH-ÞT-1P-ET",
         "so_1_þf_subj_op_þgf_et_fh_gm_þt"),
        ("so_2_þgf_þf_p1_et", "skrifa", "GM-FH-NT-1P-ET",
         "so_2_þgf_þf_et_fh_gm_nt_p1"),
        ("so_0_lhþt_et_kk", "kembdur", "LHÞT-SB-KK-NFET",
         "so_0_et_kk_lhþt_nf_sb"),
    )
    # Rows are checked in order, so the first mismatch stops the test
    for terminal, word, tags, expected in cases:
        augmented = augment_terminal(terminal, word, tags)
        assert augmented == expected
def test_augment_terminal():
    """Check augment_terminal() against a fixed table of verb terminals.

    Each row holds the three arguments passed to augment_terminal()
    (terminal name, word form, tag string) followed by the exact
    string the call is expected to return.
    """
    cases = (
        ("so_subj_op_þf", "langaði", "OP-GM-FH-ÞT-3P-ET",
         "so_subj_op_þf_et_fh_gm_þt"),
        ("so_subj_sagnb_þf", "langað", "GM-SAGNB",
         "so_subj_sagnb_þf_gm"),
        ("so_subj_lhþt_et_kvk", "valin", "LHÞT-SB-KVK-NFET",
         "so_subj_lhþt_et_kvk_nf_sb"),
        ("so_subj_nh", "skorta", "GM-NH",
         "so_subj_nh_gm"),
        ("so_subj_nh_þgf", "blöskra", "GM-NH",
         "so_subj_nh_þgf_gm"),
        ("so_1_þf_subj_op_þgf", "þraut", "OP-GM-FH-ÞT-1P-ET",
         "so_1_þf_subj_op_þgf_et_fh_gm_þt"),
        ("so_2_þgf_þf_p1_et", "skrifa", "GM-FH-NT-1P-ET",
         "so_2_þgf_þf_et_fh_gm_nt_p1"),
        ("so_0_lhþt_et_kk", "kembdur", "LHÞT-SB-KK-NFET",
         "so_0_et_kk_lhþt_nf_sb"),
    )
    # Rows are checked in order, so the first mismatch stops the test
    for terminal, word, tags, expected in cases:
        augmented = augment_terminal(terminal, word, tags)
        assert augmented == expected
for ix, token in enumerate(tokens):
# We have already cut away paragraph and sentence markers
# (P_BEGIN/P_END/S_BEGIN/S_END)
terminal, meaning = tmap.get(ix, (None, None))
d = describe_token(ix, token, terminal, meaning)
if words is not None:
wt = TreeUtility._word_tuple(token, terminal, meaning)
if wt is not None:
# Add the (stem, cat) combination to the words dictionary
words[wt] += 1
if ix == error_index:
# Mark the error token, if present
d["err"] = 1
if meaning is not None and "x" in d:
# Also return the augmented terminal name
d["a"] = augment_terminal(
terminal.name, d["x"].lower(), meaning.beyging
)
dump.append(d)
return dump