-
Notifications
You must be signed in to change notification settings - Fork 0
/
Formulaires.R
2370 lines (1947 loc) · 148 KB
/
Formulaires.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
# Startup -----------------------------------------------------------------
# Load libraries.
# NOTE(review): plyr is attached before dplyr, so for names exported by both
# packages the dplyr version is the one found first. xlsx and openxlsx are
# both attached but neither is called in the part of the script reviewed
# here - confirm both are still needed.
library(RecordLinkage)
library(plyr)
library(dplyr)
library(readxl)
library(xlsx)
library(openxlsx)
library(stringr)
library(data.table)
library(Hmisc)
library(bigmemory)
# Silence bigmemory's typecast warning: further down, linkage weights are
# written into a big.matrix declared with type "short".
options(bigmemory.typecast.warning=FALSE)
# Normalise phone numbers and blank out obvious placeholder values.
#
# Args:
#   x: vector of phone numbers (coerced to character); NA entries are allowed.
#
# Returns:
#   An unnamed character vector of the same length as `x`. Each number has its
#   spaces, "+" and "-" removed, capital "O" replaced by "0", a leading "33"
#   replaced by "0", and is left-padded with "0" to at least 10 characters.
#   Numbers containing one of the junk sequences ("00000000", "12345",
#   "010101", "999999", "111111") are returned as NA, as are NA inputs.
#
# The previous version ran five per-element sapply() passes, which attached
# the padded numbers as names, returned list() for zero-length input and
# returned a logical vector when every number was rejected. This version is
# vectorised and always returns a plain character vector.
formattelephone <- function(x) {
  x <- gsub(" ", "", x, fixed = TRUE)
  x <- gsub("O", "0", x, fixed = TRUE)
  x <- gsub("+", "", x, fixed = TRUE)
  x <- sub("^33", "0", x)
  x <- gsub("-", "", x, fixed = TRUE)

  # Left-pad short numbers with zeros; NA entries are left untouched.
  a_completer <- !is.na(x) & nchar(x) < 10
  x[a_completer] <- paste0(
    strrep("0", 10 - nchar(x[a_completer])),
    x[a_completer]
  )

  # Any of these sequences marks the number as a placeholder.
  x[grepl("00000000|12345|010101|999999|111111", x)] <- NA_character_
  x
}
# Data import
# The member extract is read with fread(); the region and department
# reference tables come from the "Feuille1" sheet of their workbooks.
full_tit <- as.data.table(fread("Full_Titulaires.csv"))
regions <- read_excel("reg2016.xls", sheet = "Feuille1")
dpt <- read_excel("depts2016.xls", sheet = "Feuille1")

# Preparation of the department -> region lookup table
# Keep only the code/name columns and give them short names.
regions <- setNames(
  regions[, c("REGION,C,2", "NCC,C,70")],
  c("numReg", "nomReg")
)
dpt <- setNames(
  dpt[, c("DEP,C,3", "NCC,C,70", "REGION,C,2")],
  c("numDpt", "nomDpt", "numReg")
)
# Attach the region name to every department (plyr left join).
dpt <- join(dpt, regions, by = "numReg", type = "left")

# Region names: lower-case everything, then upper-case the first letter at the
# start of the string and after each whitespace or hyphen.
nom_region <- tolower(dpt$nomReg)
nom_region <- gsub("(^|[[:space:]]|\\-)([[:alpha:]])", "\\1\\U\\2", nom_region, perl = TRUE)
# Hyphens become line breaks (presumably so long names wrap in plot labels).
dpt$nomReg <- gsub("\\-", "\n", nom_region)

# Extra row whose four fields are all "Etranger", matched by the "Etranger"
# postal-code marker set during cleaning.
dpt <- rbind(dpt, rep("Etranger", 4))
# Cleaning of the member extract.
# Drop placeholder/test records: surname "XXXXXX" or "TEST", first name "TEST".
# filter() also drops rows where a tested field is NA.
full_tit <- filter(
  full_tit,
  PRE_PERS_NOMUS != "XXXXXX",
  PRE_PERS_NOMUS != "TEST",
  PRE_PERS_PREUS != "TEST"
)
# Keep only first names of at least two characters.
full_tit <- filter(full_tit, nchar(PRE_PERS_PREUS) > 1)

# Empty strings anywhere in the table become NA.
full_tit[full_tit==""]<-NA

# Phone numbers: normalise both the landline and the mobile column.
for (col_tel in c("PRE_DOSS_TELFIXE", "PRE_DOSS_TELPORT")) {
  full_tit[[col_tel]] <- formattelephone(full_tit[[col_tel]])
}
rm(col_tel)

# Birth year taken from characters 6 to 10 of the birth date.
# NOTE(review): this is a 5-character window; confirm the layout of
# PRE_PERS_DTNAI, since a 4-digit year would need a 4-character window.
full_tit$ANNEE_NAISS <- substr(full_tit$PRE_PERS_DTNAI, 6, 10)

# E-mail: lower-case, strip spaces, then blank out placeholder addresses.
mail <- gsub(' ', '', tolower(full_tit$PRE_DOSS_MAIL))
mail[grepl("pasdemail|adresse|pasde@|xxxx", mail)] <- NA
full_tit$PRE_DOSS_MAIL <- mail
rm(mail)

# Postal code: any country code outside this list (NA counts as listed) is
# flagged "Etranger"; remaining codes are left-padded with "0" to 5 characters.
pays_conserves <- c(NA, "100", "138", "200", "300", "400", "428", "607", "700", "701", "705")
code_postal <- full_tit$PRE_DOSS_CP
code_postal[full_tit$PRE_DOSS_CPAYS %nin% pays_conserves] <- "Etranger"
full_tit$PRE_DOSS_CP <- str_pad(code_postal, width = 5, side = "left", pad = "0")
rm(pays_conserves)

full_tit <- select(full_tit, -c(PRE_DOSS_CPAYS, PRE_PERS_TYPE))

# Department code: first 3 characters for postal codes starting with "97",
# first 2 characters otherwise, "Etranger" for flagged rows.
# NOTE(review): Corsican postal codes start with "20"; if the department table
# lists Corsica as "2A"/"2B" those rows get no department/region - confirm.
code_postal <- full_tit$PRE_DOSS_CP
prefixe <- ifelse(grepl("^97", code_postal), substr(code_postal, 1, 3), substr(code_postal, 1, 2))
full_tit$numDpt <- ifelse(code_postal == "Etranger", "Etranger", prefixe)
rm(code_postal, prefixe)

# Attach department name, region code and region name (plyr join, left by default).
full_tit <- join(full_tit, dpt, by = "numDpt")
# Split
# Records are split on PRE_PERS_MUNAPA: above 99000000 go to `temporaires`,
# below go to `titulaires`.
# NOTE(review): a record whose PRE_PERS_MUNAPA is exactly 99000000 (or NA)
# lands in neither table - confirm this is intended.
temporaires <- as.data.table(filter(full_tit, PRE_PERS_MUNAPA > 99000000))
titulaires <- as.data.table(filter(full_tit, PRE_PERS_MUNAPA < 99000000))

# Free helpers and lookup tables that are no longer needed. rm() and gc() are
# called separately: nesting them passed rm()'s NULL result positionally into
# gc()'s `reset` argument.
rm(formattelephone, dpt, regions)
gc(verbose = FALSE)
# Geographic distribution -------------------------------------------------
# Percentage breakdown of two groups over the union of their observed values.
#
# Args:
#   tit, temp: vectors of categories for the two groups; NA entries are not
#     counted.
#
# Returns:
#   A 2 x k numeric matrix (rows "Titulaires" then "Temporaires", one column
#   per distinct value, sorted), i.e. the shape barplot(beside = TRUE)
#   expects. A value seen in only one group gets 0 in the other; each row
#   sums to 100.
repartition_pct <- function(tit, temp) {
  niveaux <- sort(unique(c(as.character(tit), as.character(temp))))
  pct <- function(v) {
    effectifs <- table(factor(as.character(v), levels = niveaux))
    as.vector(effectifs) / sum(effectifs) * 100
  }
  matrix(
    c(pct(tit), pct(temp)),
    nrow = 2, byrow = TRUE,
    dimnames = list(c("Titulaires", "Temporaires"), niveaux)
  )
}

# Share of each region among titulaires and temporaires.
# The previous code set two row names on a regions x 2 data frame and passed
# that data frame to barplot(), which only accepts a vector or a matrix.
distriregion <- repartition_pct(titulaires$nomReg, temporaires$nomReg)
par(mar = c(6.5, 4, 2, 0))
barplot(distriregion, beside = TRUE, main = "Distribution des titulaires \net temporaires par région", xlab = "", ylab = "Pourcentage d'individus", las = 2, cex.names = 0.8, col = c("#A651D4", "#72C286"), ylim = c(0, 20), legend.text = TRUE)

# Share of each birth year among titulaires and temporaires.
# Rows are built in the same order as the labels; the previous code merged
# the temporaires first but labelled that row "Titulaires", swapping the legend.
distriage <- repartition_pct(titulaires$ANNEE_NAISS, temporaires$ANNEE_NAISS)
par(mar = c(6.5, 4, 2, 0))
barplot(distriage, beside = TRUE, main = "Distribution des titulaires \net temporaires par année de naissance", xlab = "Année", ylab = "Pourcentage d'individus", las = 2, cex.names = 0.8, col = c("#A651D4", "#72C286"), ylim = c(0, 4), legend.text = TRUE)

# Free the plotting intermediates (rm() and gc() called separately so that
# rm()'s NULL result is not passed into gc()'s `reset` argument).
rm(repartition_pct, distriage, distriregion)
gc(verbose = FALSE)

# The department and region-name columns were only needed for the plots;
# numReg is kept.
temporaires<-within(temporaires,rm("numDpt","nomDpt","nomReg"))
titulaires<-within(titulaires,rm("numDpt","nomDpt","nomReg"))
# Match -------------------------------------------------------------------
# Exact match on the PRE_PERS_SS key.
# Rows with a missing key are excluded on both sides before joining: empty
# strings were turned into NA during cleaning, and dplyr joins treat NA keys
# as equal by default, which would pair every key-less temporaire with every
# key-less titulaire. The disabled phone/e-mail joins below use the same
# !is.na() guard.
# NOTE(review): `match` shadows base::match(); the name is kept because code
# further down the file may refer to it.
match <- inner_join(
  filter(temporaires, !is.na(PRE_PERS_SS)),
  filter(titulaires, !is.na(PRE_PERS_SS)),
  by = "PRE_PERS_SS",
  suffix = c(".temp", ".tit")
)
#portable<-as.data.table(inner_join(filter(temporaires,!is.na(PRE_DOSS_TELPORT)),filter(titulaires,!is.na(PRE_DOSS_TELPORT)),by="PRE_DOSS_TELPORT",suffix=c(".temp",".tit")))
#email<-as.data.table(inner_join(filter(temporaires,!is.na(PRE_DOSS_MAIL)),filter(titulaires,!is.na(PRE_DOSS_MAIL)),by="PRE_DOSS_MAIL",suffix=c(".temp",".tit")))

# The join key comes back as a single column; duplicate it under both suffixes
# so the result has the same .temp/.tit layout as every other field.
match$PRE_PERS_SS.tit <- match$PRE_PERS_SS
match$PRE_PERS_SS.temp <- match$PRE_PERS_SS
match <- select(match, -PRE_PERS_SS)
# Record which method produced the pair.
match$Methode <- "SS"
#SS<-select(SS,c(PRE_PERS_MUNAPA.temp,PRE_PERS_NOMUS.temp,PRE_PERS_NOM.temp,PRE_PERS_PREUS.temp,PRE_PERS_DTNAI.temp,ANNEE_NAISS.temp,PRE_PERS_SS.temp,PRE_DOSS_TELFIXE.temp,PRE_DOSS_TELPORT.temp,PRE_DOSS_MAIL.temp,PRE_DOSS_RUE.temp,PRE_DOSS_CRUE.temp,PRE_DOSS_CP.temp,PRE_DOSS_VILLE.temp,numReg.temp,PRE_PERS_MUNAPA.tit,PRE_PERS_NOMUS.tit,PRE_PERS_NOM.tit,PRE_PERS_PREUS.tit,PRE_PERS_DTNAI.tit,ANNEE_NAISS.tit,PRE_PERS_SS.tit,PRE_DOSS_TELFIXE.tit,PRE_DOSS_TELPORT.tit,PRE_DOSS_MAIL.tit,PRE_DOSS_RUE.tit,PRE_DOSS_CRUE.tit,PRE_DOSS_CP.tit,PRE_DOSS_VILLE.tit,numReg.tit,Methode))
#portable$PRE_DOSS_TELPORT.tit<-portable$PRE_DOSS_TELPORT
#portable$PRE_DOSS_TELPORT.temp<-portable$PRE_DOSS_TELPORT
#portable<-select(portable,-PRE_DOSS_TELPORT)
#portable$Methode<-"Portable"
#email$PRE_DOSS_MAIL.tit<-email$PRE_DOSS_MAIL
#email$PRE_DOSS_MAIL.temp<-email$PRE_DOSS_MAIL
#email<-select(email,-PRE_DOSS_MAIL)
#email$Methode<-"email"
#match<-rbind(SS,portable,email) %>% as.data.table()

# One row per (temporaire, titulaire) pair, columns in a fixed order:
# all .temp fields, then all .tit fields, then the method.
match <- distinct(match, PRE_PERS_MUNAPA.temp, PRE_PERS_MUNAPA.tit, .keep_all = TRUE)
match <- select(match, c(
  PRE_PERS_MUNAPA.temp, PRE_PERS_NOMUS.temp, PRE_PERS_NOM.temp, PRE_PERS_PREUS.temp,
  PRE_PERS_DTNAI.temp, ANNEE_NAISS.temp, PRE_PERS_SS.temp, PRE_DOSS_TELFIXE.temp,
  PRE_DOSS_TELPORT.temp, PRE_DOSS_MAIL.temp, PRE_DOSS_RUE.temp, PRE_DOSS_CRUE.temp,
  PRE_DOSS_CP.temp, PRE_DOSS_VILLE.temp, numReg.temp,
  PRE_PERS_MUNAPA.tit, PRE_PERS_NOMUS.tit, PRE_PERS_NOM.tit, PRE_PERS_PREUS.tit,
  PRE_PERS_DTNAI.tit, ANNEE_NAISS.tit, PRE_PERS_SS.tit, PRE_DOSS_TELFIXE.tit,
  PRE_DOSS_TELPORT.tit, PRE_DOSS_MAIL.tit, PRE_DOSS_RUE.tit, PRE_DOSS_CRUE.tit,
  PRE_DOSS_CP.tit, PRE_DOSS_VILLE.tit, numReg.tit,
  Methode
))
#gc(rm(email,portable,SS),verbose=FALSE)

# Remove the records already matched so the linkage steps that follow only
# see the remaining ones.
temporaires <- filter(temporaires, !(PRE_PERS_MUNAPA %in% match$PRE_PERS_MUNAPA.temp))
titulaires <- filter(titulaires, !(PRE_PERS_MUNAPA %in% match$PRE_PERS_MUNAPA.tit))
# Record linkage
# The remaining temporaires are compared with the remaining titulaires one
# slice of `titulaires` at a time; `taille` is the (possibly fractional) slice
# length for 200 slices. This part handles slices 0 to 32; the following
# slices are processed further down the file with the same `taille`, `links`,
# `possible_links`, `poids` and `paires` objects.
taille <- nrow(titulaires) / 200
# Weights of all candidate pairs, appended slice after slice.
# NOTE(review): type "short" stores integers, so the weights written below
# lose their fractional part (presumably accepted to save memory - confirm).
poids <- big.matrix(nrow = (taille * nrow(temporaires) + 500), ncol = 1, type = "short")

# Compare all temporaires with one slice of titulaires and classify the pairs.
#
# Args:
#   temp: table of temporaires.
#   tit_tranche: slice of the titulaires table (same columns as `temp`).
#
# Returns:
#   The RecordLinkage object returned by fsClassify(): candidate pairs are
#   restricted to records agreeing on columns 14 and 15, columns
#   2,3,4,5,7,8,9,10,12 are compared with Jaro-Winkler, weights come from
#   fsWeights() with the fixed m-probabilities below, and pairs are classified
#   with thresholds 35 (upper) and 20 (lower).
lier_tranche <- function(temp, tit_tranche) {
  rl <- compare.linkage(
    temp, tit_tranche,
    strcmpfun = jarowinkler,
    strcmp = c(2, 3, 4, 5, 7, 8, 9, 10, 12),
    blockfld = c(14, 15),
    exclude = c(1, 6, 11, 13, 14, 15)
  )
  rl <- fsWeights(
    rl,
    m = c(0.9, 0.8, 0.9, 0.8, 0.5, 0.5, 0.4, 0.4, 0.3),
    u = rl$frequencies
  )
  fsClassify(rl, threshold.upper = 35, threshold.lower = 20)
}

links <- NULL
possible_links <- NULL
paires <- 0  # number of weights already written to `poids` (kept as double)

for (tranche in 0:32) {
  # Integer slice bounds. With a fractional `taille` the former
  # (k*taille+1):((k+1)*taille) sequences could skip the row between two
  # slices; flooring both ends keeps consecutive slices contiguous, and the
  # end of slice 32 still meets the start of slice 33 handled further down.
  debut <- floor(tranche * taille) + 1
  fin <- floor((tranche + 1) * taille)
  if (fin < debut) {
    next  # fewer rows than slices: nothing in this slice
  }

  reclink <- lier_tranche(temporaires, titulaires[debut:fin, ])
  liens <- getPairs(reclink, single.rows = TRUE, show = "links")
  liens_possibles <- getPairs(reclink, single.rows = TRUE, show = "possible")

  # Appended incrementally, like the stanzas further down the file, so the
  # resulting tables are built exactly the same way throughout.
  links <- if (is.null(links)) liens else rbind(links, liens)
  possible_links <- if (is.null(possible_links)) {
    liens_possibles
  } else {
    rbind(possible_links, liens_possibles)
  }

  # Store this slice's weights right after the ones already written. The
  # guard avoids the descending index (paires+1):paires when a slice yields
  # no candidate pair.
  nb_poids <- length(reclink$Wdata)
  if (nb_poids > 0) {
    poids[(paires + 1):(paires + nb_poids)] <- reclink$Wdata
  }
  paires <- as.numeric(paires + nrow(reclink$pairs))

  # Release the slice results before the next iteration (rm() and gc() are
  # called separately so rm()'s NULL is not passed into gc()'s `reset`).
  rm(reclink, liens, liens_possibles)
  gc(verbose = FALSE)
}
titulaires33<-titulaires[(33*taille+1):(34*taille),]
reclink<-compare.linkage(temporaires,titulaires33,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires33,reclink),verbose = FALSE)
titulaires34<-titulaires[(34*taille+1):(35*taille),]
reclink<-compare.linkage(temporaires,titulaires34,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires34,reclink),verbose = FALSE)
titulaires35<-titulaires[(35*taille+1):(36*taille),]
reclink<-compare.linkage(temporaires,titulaires35,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires35,reclink),verbose = FALSE)
titulaires36<-titulaires[(36*taille+1):(37*taille),]
reclink<-compare.linkage(temporaires,titulaires36,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires36,reclink),verbose = FALSE)
titulaires37<-titulaires[(37*taille+1):(38*taille),]
reclink<-compare.linkage(temporaires,titulaires37,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires37,reclink),verbose = FALSE)
titulaires38<-titulaires[(38*taille+1):(39*taille),]
reclink<-compare.linkage(temporaires,titulaires38,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires38,reclink),verbose = FALSE)
titulaires39<-titulaires[(39*taille+1):(40*taille),]
reclink<-compare.linkage(temporaires,titulaires39,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires39,reclink),verbose = FALSE)
titulaires40<-titulaires[(40*taille+1):(41*taille),]
reclink<-compare.linkage(temporaires,titulaires40,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires40,reclink),verbose = FALSE)
titulaires41<-titulaires[(41*taille+1):(42*taille),]
reclink<-compare.linkage(temporaires,titulaires41,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires41,reclink),verbose = FALSE)
titulaires42<-titulaires[(42*taille+1):(43*taille),]
reclink<-compare.linkage(temporaires,titulaires42,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires42,reclink),verbose = FALSE)
titulaires43<-titulaires[(43*taille+1):(44*taille),]
reclink<-compare.linkage(temporaires,titulaires43,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires43,reclink),verbose = FALSE)
titulaires44<-titulaires[(44*taille+1):(45*taille),]
reclink<-compare.linkage(temporaires,titulaires44,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires44,reclink),verbose = FALSE)
titulaires45<-titulaires[(45*taille+1):(46*taille),]
reclink<-compare.linkage(temporaires,titulaires45,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires45,reclink),verbose = FALSE)
titulaires46<-titulaires[(46*taille+1):(47*taille),]
reclink<-compare.linkage(temporaires,titulaires46,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires46,reclink),verbose = FALSE)
titulaires47<-titulaires[(47*taille+1):(48*taille),]
reclink<-compare.linkage(temporaires,titulaires47,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires47,reclink),verbose = FALSE)
titulaires48<-titulaires[(48*taille+1):(49*taille),]
reclink<-compare.linkage(temporaires,titulaires48,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires48,reclink),verbose = FALSE)
titulaires49<-titulaires[(49*taille+1):(50*taille),]
reclink<-compare.linkage(temporaires,titulaires49,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires49,reclink),verbose = FALSE)
titulaires50<-titulaires[(50*taille+1):(51*taille),]
reclink<-compare.linkage(temporaires,titulaires50,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires50,reclink),verbose = FALSE)
titulaires51<-titulaires[(51*taille+1):(52*taille),]
reclink<-compare.linkage(temporaires,titulaires51,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires51,reclink),verbose = FALSE)
titulaires52<-titulaires[(52*taille+1):(53*taille),]
reclink<-compare.linkage(temporaires,titulaires52,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires52,reclink),verbose = FALSE)
titulaires53<-titulaires[(53*taille+1):(54*taille),]
reclink<-compare.linkage(temporaires,titulaires53,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires53,reclink),verbose = FALSE)
titulaires54<-titulaires[(54*taille+1):(55*taille),]
reclink<-compare.linkage(temporaires,titulaires54,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires54,reclink),verbose = FALSE)
titulaires55<-titulaires[(55*taille+1):(56*taille),]
reclink<-compare.linkage(temporaires,titulaires55,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires55,reclink),verbose = FALSE)
titulaires56<-titulaires[(56*taille+1):(57*taille),]
reclink<-compare.linkage(temporaires,titulaires56,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires56,reclink),verbose = FALSE)
titulaires57<-titulaires[(57*taille+1):(58*taille),]
reclink<-compare.linkage(temporaires,titulaires57,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires57,reclink),verbose = FALSE)
titulaires58<-titulaires[(58*taille+1):(59*taille),]
reclink<-compare.linkage(temporaires,titulaires58,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires58,reclink),verbose = FALSE)
titulaires59<-titulaires[(59*taille+1):(60*taille),]
reclink<-compare.linkage(temporaires,titulaires59,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires59,reclink),verbose = FALSE)
titulaires60<-titulaires[(60*taille+1):(61*taille),]
reclink<-compare.linkage(temporaires,titulaires60,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires60,reclink),verbose = FALSE)
titulaires61<-titulaires[(61*taille+1):(62*taille),]
reclink<-compare.linkage(temporaires,titulaires61,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires61,reclink),verbose = FALSE)
titulaires62<-titulaires[(62*taille+1):(63*taille),]
reclink<-compare.linkage(temporaires,titulaires62,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires62,reclink),verbose = FALSE)
titulaires63<-titulaires[(63*taille+1):(64*taille),]
reclink<-compare.linkage(temporaires,titulaires63,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires63,reclink),verbose = FALSE)
titulaires64<-titulaires[(64*taille+1):(65*taille),]
reclink<-compare.linkage(temporaires,titulaires64,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires64,reclink),verbose = FALSE)
titulaires65<-titulaires[(65*taille+1):(66*taille),]
reclink<-compare.linkage(temporaires,titulaires65,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires65,reclink),verbose = FALSE)
titulaires66<-titulaires[(66*taille+1):(67*taille),]
reclink<-compare.linkage(temporaires,titulaires66,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires66,reclink),verbose = FALSE)
titulaires67<-titulaires[(67*taille+1):(68*taille),]
reclink<-compare.linkage(temporaires,titulaires67,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires67,reclink),verbose = FALSE)
titulaires68<-titulaires[(68*taille+1):(69*taille),]
reclink<-compare.linkage(temporaires,titulaires68,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires68,reclink),verbose = FALSE)
titulaires69<-titulaires[(69*taille+1):(70*taille),]
reclink<-compare.linkage(temporaires,titulaires69,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires69,reclink),verbose = FALSE)
titulaires70<-titulaires[(70*taille+1):(71*taille),]
reclink<-compare.linkage(temporaires,titulaires70,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires70,reclink),verbose = FALSE)
titulaires71<-titulaires[(71*taille+1):(72*taille),]
reclink<-compare.linkage(temporaires,titulaires71,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires71,reclink),verbose = FALSE)
titulaires72<-titulaires[(72*taille+1):(73*taille),]
reclink<-compare.linkage(temporaires,titulaires72,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires72,reclink),verbose = FALSE)
titulaires73<-titulaires[(73*taille+1):(74*taille),]
reclink<-compare.linkage(temporaires,titulaires73,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires73,reclink),verbose = FALSE)
titulaires74<-titulaires[(74*taille+1):(75*taille),]
reclink<-compare.linkage(temporaires,titulaires74,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires74,reclink),verbose = FALSE)
titulaires75<-titulaires[(75*taille+1):(76*taille),]
reclink<-compare.linkage(temporaires,titulaires75,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires75,reclink),verbose = FALSE)
titulaires76<-titulaires[(76*taille+1):(77*taille),]
reclink<-compare.linkage(temporaires,titulaires76,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires76,reclink),verbose = FALSE)
titulaires77<-titulaires[(77*taille+1):(78*taille),]
reclink<-compare.linkage(temporaires,titulaires77,strcmpfun = jarowinkler,strcmp = c(2,3,4,5,7,8,9,10,12),blockfld = c(14,15), exclude = c(1,6,11,13,14,15))
reclink<-fsWeights(reclink,m=c(0.9,0.8,0.9,0.8,0.5,0.5,0.4,0.4,0.3),u=reclink$frequencies)
reclink<-fsClassify(reclink,threshold.upper=35,threshold.lower=20)
links<-rbind(links,getPairs(reclink,single.rows = TRUE, show="links"))
possible_links<-rbind(possible_links,getPairs(reclink,single.rows = TRUE, show="possible"))
poids[(paires+1):(paires+length(reclink$Wdata))]<-reclink$Wdata
paires<-as.numeric(paires+nrow(reclink$pairs))
gc(rm(titulaires77,reclink),verbose = FALSE)
# Chunk 78: rows 78*taille+1 to 79*taille of `titulaires`.
titulaires78<-titulaires[(78*taille+1):(79*taille),]