parent
7ef6b87cb8
commit
ff52072867
@@ -1,20 +1,23 @@
|
|||||||
from sentence_transformers import SentenceTransformer
|
from sentence_transformers import SentenceTransformer
|
||||||
import numpy as np
|
import numpy as np
|
||||||
|
|
||||||
ltable_path = r'E:\Data\Research\Projects\matching_dependency\datasets\iTunes-Amazon_dirty\tableA.csv'
|
ltable_path = r'E:\Data\Research\Projects\matching_dependency\datasets\Abt-Buy\tableA.csv'
|
||||||
rtable_path = r'E:\Data\Research\Projects\matching_dependency\datasets\iTunes-Amazon_dirty\tableB.csv'
|
rtable_path = r'E:\Data\Research\Projects\matching_dependency\datasets\Abt-Buy\tableB.csv'
|
||||||
mapping_path = r'E:\Data\Research\Projects\matching_dependency\datasets\iTunes-Amazon_dirty\matches.csv'
|
mapping_path = r'E:\Data\Research\Projects\matching_dependency\datasets\Abt-Buy\matches.csv'
|
||||||
mapping_lid = 'ltable_id' # mapping表中左表id名
|
mapping_lid = 'idAbt' # mapping表中左表id名
|
||||||
mapping_rid = 'rtable_id' # mapping表中右表id名
|
mapping_rid = 'idBuy' # mapping表中右表id名
|
||||||
ltable_id = 'id' # 左表id字段名称
|
ltable_id = 'id' # 左表id字段名称
|
||||||
rtable_id = 'id' # 右表id字段名称
|
rtable_id = 'id' # 右表id字段名称
|
||||||
target_attr = 'id' # 进行md挖掘时的目标字段
|
target_attr = 'id' # 进行md挖掘时的目标字段
|
||||||
# lr_attrs_map = {} # 如果两个表中存在对应字段名称不一样的情况,将名称加入列表便于调整一致
|
# lr_attrs_map = {} # 如果两个表中存在对应字段名称不一样的情况,将名称加入列表便于调整一致
|
||||||
similarity_threshold = 0.16
|
|
||||||
support_threshold = 70
|
model = SentenceTransformer('E:\\Data\\Research\\Models\\roberta-large-nli-stsb-mean-tokens')
|
||||||
confidence_threshold = 0.3
|
similarity_threshold = 0.2
|
||||||
interpre_weight = 1 # 可解释性权重
|
support_threshold = 100
|
||||||
|
confidence_threshold = 0.4
|
||||||
|
interpre_weight = 0.5 # 可解释性权重
|
||||||
|
|
||||||
er_output_dir = 'E:\\Data\\Research\\Projects\\matching_dependency\\ml_er\\output\\'
|
er_output_dir = 'E:\\Data\\Research\\Projects\\matching_dependency\\ml_er\\output\\'
|
||||||
md_output_dir = 'E:\\Data\\Research\\Projects\\matching_dependency\\md_discovery\\output\\'
|
md_output_dir = 'E:\\Data\\Research\\Projects\\matching_dependency\\md_discovery\\output\\'
|
||||||
hpo_output_dir = 'E:\\Data\\Research\\Projects\\matching_dependency\\hpo\\output\\'
|
hpo_output_dir = 'E:\\Data\\Research\\Projects\\matching_dependency\\hpo\\output\\'
|
||||||
model = SentenceTransformer('E:\\Data\\Research\\Models\\roberta-large-nli-stsb-mean-tokens')
|
|
||||||
|
Loading…
Reference in new issue