Entity Matching by Similarity Join
 
Loading...
Searching...
No Matches
simjoin_entitymatching.matcher.match Namespace Reference

Functions

 train_model (tableA, tableB, gold_graph, blocking_attr, model_path, tree_path, range_path, num_tree, sample_size, ground_truth_label, write_all_features=True, write_used_features=False, training_strategy=Literal['basic', 'tuning', 'active'], inmemory=Literal[0, 1], num_data=Literal[1, 2], at_ltable=None, at_rtable=None, dataname=None, default_sample_res_dir="", default_vmatcher_dir="", default_gold_dir="", default_icv_dir="", default_feature_name_dir="")
 
 match_via_megallen_features (tableA, tableB, gold_graph, gold_len, model_path, is_interchangeable, flag_consistent, at_ltable=None, at_rtable=None, group=None, cluster=None, default_blk_res_dir="", default_match_res_dir="", default_fea_names_dir="")
 
 match_via_cpp_features (tableA, tableB, gold_graph, gold_len, model_path, is_interchangeable, flag_consistent, numeric_attr, at_ltable=None, at_rtable=None, default_blk_res_dir="", default_match_res_dir="", default_fea_names_dir="", default_icv_dir="")
 
 match_on_neg_pres (tableA, tableB, gold_graph, gold_len, model_path, is_interchangeable, flag_consistent, numeric_attr, at_ltable=None, at_rtable=None, default_match_res_dir="", default_fea_names_dir="", default_icv_dir="")
 
 debug_rf_matcher (tableA, tableB, gold_graph, gold_len, model_path, is_interchangeable, flag_consistent, numeric_attr, at_ltable=None, at_rtable=None, default_match_res_dir="", default_fea_names_dir="", default_icv_dir="")
 

Function Documentation

◆ debug_rf_matcher()

simjoin_entitymatching.matcher.match.debug_rf_matcher(
    tableA,
    tableB,
    gold_graph,
    gold_len,
    model_path,
    is_interchangeable,
    flag_consistent,
    numeric_attr,
    at_ltable=None,
    at_rtable=None,
    default_match_res_dir="",
    default_fea_names_dir="",
    default_icv_dir=""
)

◆ match_on_neg_pres()

simjoin_entitymatching.matcher.match.match_on_neg_pres(
    tableA,
    tableB,
    gold_graph,
    gold_len,
    model_path,
    is_interchangeable,
    flag_consistent,
    numeric_attr,
    at_ltable=None,
    at_rtable=None,
    default_match_res_dir="",
    default_fea_names_dir="",
    default_icv_dir=""
)

◆ match_via_cpp_features()

simjoin_entitymatching.matcher.match.match_via_cpp_features(
    tableA,
    tableB,
    gold_graph,
    gold_len,
    model_path,
    is_interchangeable,
    flag_consistent,
    numeric_attr,
    at_ltable=None,
    at_rtable=None,
    default_blk_res_dir="",
    default_match_res_dir="",
    default_fea_names_dir="",
    default_icv_dir=""
)

◆ match_via_megallen_features()

simjoin_entitymatching.matcher.match.match_via_megallen_features(
    tableA,
    tableB,
    gold_graph,
    gold_len,
    model_path,
    is_interchangeable,
    flag_consistent,
    at_ltable=None,
    at_rtable=None,
    group=None,
    cluster=None,
    default_blk_res_dir="",
    default_match_res_dir="",
    default_fea_names_dir=""
)

◆ train_model()

simjoin_entitymatching.matcher.match.train_model(
    tableA,
    tableB,
    gold_graph,
    blocking_attr,
    model_path,
    tree_path,
    range_path,
    num_tree,
    sample_size,
    ground_truth_label,
    write_all_features=True,
    write_used_features=False,
    training_strategy=Literal['basic', 'tuning', 'active'],
    inmemory=Literal[0, 1],
    num_data=Literal[1, 2],
    at_ltable=None,
    at_rtable=None,
    dataname=None,
    default_sample_res_dir="",
    default_vmatcher_dir="",
    default_gold_dir="",
    default_icv_dir="",
    default_feature_name_dir=""
)