oagdedupe
latest
Getting Started
1. Installation
1.1. .dedupe
1.2. docker
1.3. postgres
1.4. label-studio
2. Settings
3. Dedupe
3.1. train model
3.2. start FastAPI
3.3. label-studio
3.4. predictions
4. Record Linkage
4.1. train model
4.2. start FastAPI
4.3. label-studio
4.4. predictions
User Guide
1. Intro
1.1. Scalability
1.2. Active Learning
1.3. Pipeline Overview
2. Key Terms
3. Generate Training Samples
4. Blocking
5. Distance
6. Classifier
7. Active Learning Loop
7.1. Initialization and First Pass
7.2. New Active Learning Loop
7.3. Predictions on Full Data
8. Clustering
Examples
Dedupe Example
Record Linkage Example
API Reference
API
BaseModel
Dedupe
Fapi
RecordLinkage
Database
SQLAlchemy ORM Tables
Initialize
Database Interface
Blocker
block.blocking
block.forward
block.learner
block.sql
Distance
Distance
Cluster
Cluster
oagdedupe
Index
Edit on GitHub
Index
_
|
A
|
B
|
C
|
D
|
E
|
F
|
G
|
H
|
I
|
K
|
L
|
M
|
N
|
O
|
P
|
R
|
S
|
U
_
__init__() (oagdedupe.api.BaseModel method)
(oagdedupe.api.Dedupe method)
(oagdedupe.api.Fapi method)
(oagdedupe.api.RecordLinkage method)
(oagdedupe.block.blocking.Blocking method)
(oagdedupe.block.forward.Forward method)
(oagdedupe.block.learner.Conjunctions method)
(oagdedupe.cluster.cluster.ConnectedComponents method)
__post_init__() (oagdedupe.api.BaseModel method)
(oagdedupe.api.Dedupe method)
(oagdedupe.api.Fapi method)
(oagdedupe.api.RecordLinkage method)
(oagdedupe.block.blocking.Blocking method)
_abc_impl (oagdedupe.api.BaseModel attribute)
(oagdedupe.api.Dedupe attribute)
(oagdedupe.api.Fapi attribute)
(oagdedupe.api.RecordLinkage attribute)
(oagdedupe.block.blocking.Blocking attribute)
(oagdedupe.block.forward.Forward attribute)
(oagdedupe.cluster.cluster.ConnectedComponents attribute)
(oagdedupe.settings.Settings attribute)
(oagdedupe.settings.SettingsDB attribute)
(oagdedupe.settings.SettingsLabelStudio attribute)
(oagdedupe.settings.SettingsModel attribute)
(oagdedupe.settings.SettingsService attribute)
_check_rr() (oagdedupe.block.blocking.Blocking method)
A
api_key (oagdedupe.settings.SettingsLabelStudio attribute)
attributes (oagdedupe.settings.Settings attribute)
B
BaseModel (class in oagdedupe.api)
Blocking (class in oagdedupe.block.blocking)
build_forward_indices() (oagdedupe.block.forward.Forward method)
C
cluster (oagdedupe.api.BaseModel attribute)
compare_cols (oagdedupe.settings.Settings property)
conj (oagdedupe.block.blocking.Blocking attribute)
Conjunctions (class in oagdedupe.block.learner)
conjunctions_list (oagdedupe.block.learner.Conjunctions property)
ConnectedComponents (class in oagdedupe.cluster.cluster)
cpus (oagdedupe.settings.SettingsModel attribute)
D
db (oagdedupe.settings.Settings attribute)
(oagdedupe.settings.SettingsDB property)
db_schema (oagdedupe.settings.SettingsDB attribute)
Dedupe (class in oagdedupe.api)
dedupe (oagdedupe.settings.SettingsModel attribute)
description (oagdedupe.settings.SettingsLabelStudio attribute)
E
env_file (oagdedupe.settings.Settings.Config attribute)
env_nested_delimiter (oagdedupe.settings.Settings.Config attribute)
env_prefix (oagdedupe.settings.Settings.Config attribute)
F
Fapi (class in oagdedupe.api)
fast_api (oagdedupe.settings.Settings attribute)
fit_blocks() (oagdedupe.api.BaseModel method)
folder (oagdedupe.settings.Settings attribute)
Forward (class in oagdedupe.block.forward)
forward (oagdedupe.block.blocking.Blocking attribute)
G
get_connected_components() (oagdedupe.cluster.cluster.ConnectedComponents method)
get_connected_components_link() (oagdedupe.cluster.cluster.ConnectedComponents method)
get_df_cluster() (oagdedupe.cluster.cluster.ConnectedComponents method)
H
host (oagdedupe.settings.SettingsService attribute)
I
inherit_attr() (in module oagdedupe.utils)
initialize() (oagdedupe.api.BaseModel method)
(oagdedupe.api.Dedupe method)
(oagdedupe.api.Fapi method)
(oagdedupe.api.RecordLinkage method)
K
k (oagdedupe.settings.SettingsModel attribute)
L
label_studio (oagdedupe.settings.Settings attribute)
M
max_compare (oagdedupe.settings.SettingsModel attribute)
model (oagdedupe.settings.Settings attribute)
module
oagdedupe.api
oagdedupe.block.blocking
oagdedupe.block.forward
oagdedupe.block.learner
oagdedupe.cluster.cluster
oagdedupe.settings
oagdedupe.utils
N
n (oagdedupe.settings.SettingsModel attribute)
n_covered (oagdedupe.settings.SettingsModel attribute)
name (oagdedupe.settings.Settings attribute)
O
oagdedupe.api
module
oagdedupe.block.blocking
module
oagdedupe.block.forward
module
oagdedupe.block.learner
module
oagdedupe.cluster.cluster
module
oagdedupe.settings
module
oagdedupe.utils
module
optimizer (oagdedupe.block.blocking.Blocking attribute)
(oagdedupe.block.learner.Conjunctions attribute), [1]
P
pairs (oagdedupe.block.blocking.Blocking attribute)
path_database (oagdedupe.settings.SettingsDB attribute)
path_model (oagdedupe.settings.SettingsModel attribute)
port (oagdedupe.settings.SettingsService attribute)
predict() (oagdedupe.api.BaseModel method)
R
RecordLinkage (class in oagdedupe.api)
recordlinkage() (in module oagdedupe.utils)
recordlinkage_both() (in module oagdedupe.utils)
recordlinkage_repeat() (in module oagdedupe.utils)
repo (oagdedupe.block.blocking.Blocking attribute)
(oagdedupe.block.forward.Forward attribute)
(oagdedupe.cluster.cluster.ConnectedComponents attribute)
repository (oagdedupe.block.forward.Forward attribute)
S
save() (oagdedupe.block.blocking.Blocking method)
save_comparisons() (oagdedupe.block.blocking.Blocking method)
Settings (class in oagdedupe.settings)
settings (oagdedupe.api.BaseModel attribute)
(oagdedupe.api.Dedupe attribute)
(oagdedupe.api.Fapi attribute)
(oagdedupe.api.RecordLinkage attribute)
(oagdedupe.block.forward.Forward attribute), [1]
(oagdedupe.block.learner.Conjunctions attribute), [1]
(oagdedupe.cluster.cluster.ConnectedComponents attribute)
Settings.Config (class in oagdedupe.settings)
SettingsDB (class in oagdedupe.settings)
SettingsLabelStudio (class in oagdedupe.settings)
SettingsModel (class in oagdedupe.settings)
SettingsService (class in oagdedupe.settings)
U
url (oagdedupe.settings.SettingsService property)