trafilatura 0.3.0

Extract readable content, comments, and metadata from web pages
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
{"file": "vancouversun.com.microsoft.html", "url": "https://vancouversun.com/technology/microsoft-moves-to-erase-its-carbon-footprint-from-the-atmosphere-in-climate-push/wcm/76e426d9-56de-40ad-9504-18d5101013d2", "text_len": 4304, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Microsoft Corp said on Thursday", "found": true}, {"type": "with", "string": "It was not immediately clear if", "found": true}, {"type": "without", "string": "Reuters files", "found": false}, {"type": "without", "string": "turns CO2 into soap", "found": false}, {"type": "without", "string": "I consent to receiving", "found": false}]}
{"file": "reuters.com.parasite.html", "url": "https://www.reuters.com/article/us-awards-sag/parasite-scores-upset-at-sag-awards-boosting-oscar-chances-idUSKBN1ZI0EH", "text_len": 3971, "tp": 3, "fn": 0, "fp": 1, "tn": 3, "details": [{"type": "with", "string": "cementing their roles", "found": true}, {"type": "with", "string": "Despite an unknown cast,", "found": true}, {"type": "with", "string": "Additional reporting by", "found": true}, {"type": "without", "string": "Related Coverage", "found": false}, {"type": "without", "string": "4 Min Read", "found": false}, {"type": "without", "string": "The Thomson Reuters Trust Principles", "found": true}, {"type": "without", "string": "Factbox: Key winners", "found": false}]}
{"file": "mywakenews.wordpress.com.psyop.html", "url": "https://mywakenews.wordpress.com/2016/07/09/nwo-psyop-unitedwestrike-radio-marathon/", "text_len": 30295, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "diesen Bastarden diese Worte einvernehmlicher Verkehr in den Mund???", "found": true}, {"type": "with", "string": "Kritische Betrachter haben bereits sehr viele Indizien zusammengetragen", "found": true}, {"type": "with", "string": "und unsere Wahrnehmung gefangen gehalten, manipuliert und gesteuert", "found": true}, {"type": "without", "string": "For all who want to wake up!", "found": false}, {"type": "without", "string": "Erstelle eine kostenlose Website oder Blog \u2013 auf WordPress.com", "found": false}, {"type": "without", "string": "Meine pers\u00f6nlichen Informationen nicht verkaufen", "found": false}]}
{"file": "leukefeld-handball.de.leukefeld.html", "url": "https://leukefeld-handball.de/dago-leukefeld-wird-botschafter-des-sports-der-ifzw-impulsstiftung/", "text_len": 3830, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die ifzw impulsstiftung und Dago Leukefeld besiegeln ihre gute", "found": true}, {"type": "with", "string": "mit Ihm und auf spannende Projekte im Vereinssport\u201c, so Mechthild A\u00dfmann.", "found": true}, {"type": "with", "string": "in die beteiligten Vereine beigetreten sind. F\u00fcr uns ein tolles Ergebnis.", "found": true}, {"type": "without", "string": "\u00a9 2017 Dago Leukefeld Handball", "found": false}, {"type": "without", "string": "Lieferzeit: 9-12 Tage", "found": false}, {"type": "without", "string": "Hier geht es zu den", "found": false}]}
{"file": "chabermu.wordpress.com.expertenwissen.html", "url": "https://chabermu.wordpress.com/2015/09/02/windows-expertenwissen-per-update-spioniert-microsoft-nun-auch-windows-7-8-und-8-1-aus-microsoft-privacy-windows10-chabermu/", "text_len": 5398, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Nun hat es der Softwarekonzern auch auf die Nutzerdaten", "found": true}, {"type": "with", "string": "Klicken Sie die betroffenen, optionalen Windows-Updates", "found": true}, {"type": "with", "string": "Wann jedoch Microsoft diese Abhilfe gegen seine Abh\u00f6r-Updates blockiert", "found": true}, {"type": "without", "string": "\u00a9 since 2010", "found": false}, {"type": "without", "string": "News vom Computerarchiv M\u00fcnchen", "found": false}, {"type": "without", "string": "Gib deine E-Mail-Adresse ein", "found": false}]}
{"file": "jobsnhire.com.health.html", "url": "http://www.jobsnhire.com/articles/35030/20160214/need-know-cvs-health.htm", "text_len": 2135, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "is all about helping people who are treading", "found": true}, {"type": "with", "string": "CVS Health also helps those diagnosed with complex", "found": true}, {"type": "with", "string": "17.6 percent to $2.7 billion. It seems CVS Health is really", "found": true}, {"type": "without", "string": "Get the Most Popular Jobs&Hire Stories in a Weekly Newsletter", "found": false}, {"type": "without", "string": " acceptance of our Terms and Conditions of Use and Privacy Policy. ", "found": false}, {"type": "without", "string": "t Career Options, Job Titles and Descriptions", "found": false}]}
{"file": "linksfraktion.de-Abzocke.html", "url": "https://www.linksfraktion.de/themen/nachrichten/detail/abzocke-wird-als-klimaschutz-verkauft/", "text_len": 8990, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "der Linken-Vorsitzende", "found": true}, {"type": "with", "string": "Aber was wir im Moment", "found": true}, {"type": "with", "string": "Unternehmen durch immer", "found": true}, {"type": "without", "string": "Kein Recht auf Faulheit", "found": false}, {"type": "without", "string": "Im Wortlaut von Katja", "found": false}, {"type": "without", "string": "Pressemitteilung von", "found": false}]}
{"file": "arbeitsagentur.de-arbeitsmarkt.html", "url": "https://www.arbeitsagentur.de/news/arbeitsmarkt-2022", "text_len": 1946, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "sagte der Vorstand Regionen der Bundesagentur", "found": true}, {"type": "with", "string": "Besch\u00e4ftigung nahm saisonbereinigt von Oktober", "found": true}, {"type": "with", "string": "Anzeigen wurde vom 1. bis einschlie\u00dflich", "found": true}, {"type": "without", "string": "Auf der Seite Aktuelle Meldungen 2021", "found": false}, {"type": "without", "string": "auf der Seite Entwicklung des", "found": false}, {"type": "without", "string": "Arbeitsmarkts in den Vorjahren lesen", "found": false}]}
{"file": "giromatch.com.kredit.html", "url": "https://www.giromatch.com/online-kredit/1000-euro-kredit", "text_len": 4540, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Fragen Sie noch heute den Kredit an und Sie haben bestenfalls morgen", "found": true}, {"type": "with", "string": "Grundeinkommen bzw. keine \u00dcberschuldung", "found": true}, {"type": "with", "string": "mit Express\u00fcberweisung auch als Blitzkredit auszahlbar.", "found": true}, {"type": "without", "string": "info@giromatch.com", "found": false}, {"type": "without", "string": "Ausgew\u00e4hlte Kreditprodukte", "found": false}, {"type": "without", "string": "Bewerten Sie dieses Produkt", "found": false}]}
{"file": "chemietechnik.de.forschungsgruppe fuer biotechnologie.html", "url": "https://www.chemietechnik.de/sicherheit-umwelt/covestro-startet-neue-forschungsgruppe-fuer-biotechnologie-843.html", "text_len": 3527, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Der Kunststoff-Hersteller Covestro will", "found": false}, {"type": "with", "string": "Neues Labor in Leverkusen eingerichtet", "found": true}, {"type": "with", "string": "Auch HDMA mithilfe von Biotechnologie produziert", "found": true}, {"type": "without", "string": "Auch interessant", "found": false}, {"type": "without", "string": "Diskutieren Sie mit", "found": false}, {"type": "without", "string": "Aktuellste Beitr\u00e4ge", "found": false}]}
{"file": "thisisjanewayne.com.bauch.html", "url": "https://www.thisisjanewayne.com/news/2022/09/14/von-bauchgeburten-und-falschen-gefuehlen-im-richtigen-sein/", "text_len": 12781, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u201eGeht los!\u201c, schrie", "found": true}, {"type": "with", "string": "Ben\u00f6tigen Sie psychologische", "found": true}, {"type": "with", "string": "W\u00e4hrend der Franz\u00f6sischen Revolution", "found": true}, {"type": "without", "string": "TAGS:", "found": false}, {"type": "without", "string": "Mehr von", "found": false}, {"type": "without", "string": "11 KOMMENTARE", "found": false}]}
{"file": "simmeltalzeitung.ch-Trinkwasser.html", "url": "http://simmentalzeitung.ch/Simmental/Boltigen/Trinkwasser-in-Schwarzenmatt-belastet-43157.html", "text_len": 1072, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Auf Nachfrage f\u00fchrte die Gemeinde weiter aus", "found": true}, {"type": "with", "string": "dass \u00abgeringe Mengen\u00bb des Bakteriums Escherichia coli im Rahmen", "found": true}, {"type": "with", "string": "von routinem\u00e4ssigen Probenuntersuchungen gefunden wurden", "found": true}, {"type": "without", "string": "INTERESSANTE ARTIKEL", "found": false}, {"type": "without", "string": "Artikel bewerten", "found": false}, {"type": "without", "string": "Cookies erleichtern die Bereitstellung unserer Dienste", "found": false}]}
{"file": "thebigbone.wordpress.com.ueberforderung.html", "url": "https://thebigbone.wordpress.com/2017/04/13/die-ueberforderung-durch-ueberangebote/", "text_len": 4113, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Bist du auch schon mal die Regale im Supermarkt", "found": true}, {"type": "with", "string": "Wir sind die Opfer einer Gesellschaft", "found": true}, {"type": "with", "string": "Die Beschleunigung im Privaten liegt", "found": true}, {"type": "without", "string": "Gib deine E-Mail-Adresse ein", "found": false}, {"type": "without", "string": "Kommentare zu", "found": false}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}]}
{"file": "abenteuer-astronomie.de.plejaden.html", "url": "https://abenteuer-astronomie.de/astrofoto-community/plejaden-m45-2/", "text_len": 595, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Nun nicht im Staub, sondern mit ausgepr\u00e4gten Sternstrahlen", "found": true}, {"type": "with", "string": "Art der Aufnahme: Digitalfoto", "found": true}, {"type": "with", "string": "Kasberg im Frankenland", "found": true}, {"type": "without", "string": "Hinterlasse jetzt einen Kommentar", "found": false}, {"type": "without", "string": "Sie wollen Deep-Sky-Objekte am Himmel", "found": false}, {"type": "without", "string": "Abenteuer Astronomie war eine Zeitschrift", "found": false}]}
{"file": "0a3108e507c54157a95fe7a1338f5e9c.html", "url": "https://www.investmentwatchblog.com/biggest-money-laundering-scheme-in-history-uncovered-in-ukraine/", "text_len": 5082, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Jewish oligarchs Igor Kolomoisky and", "found": true}, {"type": "with", "string": "The Chairwoman of Ukraine\u2019s Central Bank", "found": true}, {"type": "with", "string": "Now as to those missing IMF billions, ", "found": true}, {"type": "without", "string": "Privacy & Cookies: This site uses", "found": false}, {"type": "without", "string": "If you\u2019re running an ad-blocker", "found": false}, {"type": "without", "string": "Don't have time to read every single post", "found": false}]}
{"file": "infocomcgt.fr.caisse.html", "url": "https://www.infocomcgt.fr/caisse-de-solidarite-financiere/", "text_len": 6278, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "ou tout autre r\u00e9gression sociale", "found": true}, {"type": "with", "string": "1 545 500 EUROS", "found": true}, {"type": "with", "string": "Reportage JT 13 heures de France 2", "found": true}, {"type": "without", "string": "On n\u2019est pas de la chair \u00e0 patron", "found": false}, {"type": "without", "string": "Votre adresse e-mail ne sera pas publi\u00e9e", "found": false}, {"type": "without", "string": "Contactez vos repr\u00e9sentants", "found": false}]}
{"file": "geschichtedergegenwart.ch.foucault.html", "url": "https://geschichtedergegenwart.ch/mit-foucault-die-pandemie-verstehen/", "text_len": 16174, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u201e\u00dcber\u00adle\u00adbens\u201c aller demo\u00adkra\u00adti\u00adschen Hinder\u00adnisse und k\u00f6nnen endlich", "found": false}, {"type": "with", "string": "Daher sei das \u201eVerh\u00e4ltnis zu sich selbst\u201c, wie Foucault", "found": true}, {"type": "with", "string": "einge\u00adf\u00fchrt, um das Auftau\u00adchen neuer poli\u00adti\u00adscher Ziele und Stra\u00adte\u00adgien in", "found": false}, {"type": "without", "string": "Die Versu\u00adchungen des Abso\u00adlu\u00adtismus.", "found": false}, {"type": "without", "string": "Sinn ohne Wort. Vom \u201eVolks\u00adthum\u201c und anderen \u201eThum\u00adheiten\u201c", "found": false}, {"type": "without", "string": "lehrt Geschichte der Neu\u00adzeit", "found": false}]}
{"file": "eatwhattonight.com.stir.html", "url": "https://eatwhattonight.com/2020/09/vegan-styled-char-kway-teow-stir-fry-flat-rice-noodles/", "text_len": 2297, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Once in a while, I liked to go vegan", "found": true}, {"type": "with", "string": "With 2 tbsp oil left in the wok", "found": true}, {"type": "with", "string": "120g kway teow (flat rice noodles)\u2063", "found": false}, {"type": "without", "string": "I am Joyce from Sunny Singapore", "found": false}, {"type": "without", "string": "Enter your keywords", "found": false}, {"type": "without", "string": "Print Recipe", "found": false}]}
{"file": "ekiba.de-trauer.html", "url": "https://www.ekiba.de/detail/nachricht-seite/id/35204-trauern-digital-am-ewigkeitssonntag/?default=true", "text_len": 2770, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Gottesdiensten ihrer Gemeinden", "found": true}, {"type": "with", "string": "Namen von Verstorbenen", "found": true}, {"type": "with", "string": " und dazu laden wir herzlich ein", "found": true}, {"type": "without", "string": "Kirchengemeinde braucht klares Ziel\u201c", "found": false}, {"type": "without", "string": "Erlebnisraum Kirche", "found": false}, {"type": "without", "string": "weitere Veranstaltungen ...", "found": false}]}
{"file": "chineselyrics4u.com.zhineng.html", "url": "http://www.chineselyrics4u.com/2011/07/zhi-neng-xiang-nian-ni-jam-hsiao-jing.html", "text_len": 646, "tp": 2, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "\u5c31\u653e\u5fc3\u53bb\u5427", "found": true}, {"type": "with", "string": "Repeat Chorus", "found": true}, {"type": "without", "string": "Posted by K A", "found": false}, {"type": "without", "string": "Older post", "found": false}, {"type": "without", "string": "Thank you for your support!", "found": false}, {"type": "without", "string": "Follower", "found": false}]}
{"file": "together.ch.schaffhausen.html", "url": "https://together.ch/de/karriere/events-messen/119-sprungbrett-event-schaffhausen", "text_len": 995, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "f\u00fcr eine erfolgreiche Zukunft!", "found": true}, {"type": "with", "string": "In einer lockeren Atmosph\u00e4re", "found": false}, {"type": "with", "string": "Anreise", "found": false}, {"type": "without", "string": "Abonniere unseren Newsletter", "found": false}, {"type": "without", "string": "Partner f\u00fcr Studium", "found": false}, {"type": "without", "string": "F\u00fcr Hochschulen", "found": false}]}
{"file": "trainingline-english.de.einzeltraining.html", "url": "https://www.trainingline-english.de/am-telefon-1/einzeltraining/", "text_len": 2455, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Beim Englischtraining am Telefon", "found": true}, {"type": "with", "string": "Das Englischtraining am Telefon", "found": true}, {"type": "with", "string": "Und mit jedem Satz w\u00e4chst", "found": true}, {"type": "without", "string": "51467 Bergisch Gladbach", "found": false}, {"type": "without", "string": "...und fast unbemerkt", "found": false}, {"type": "without", "string": "+49 (0)2202 -2809436", "found": false}]}
{"file": "0a6291ebbce449b3b04256b43c73e39d.html", "url": "https://wien.orf.at/stories/3017954/", "text_len": 2394, "tp": 0, "fn": 3, "fp": 0, "tn": 5, "details": [{"type": "with", "string": "Die Opernball-Grande-Dame und Burgschauspielerin Lotte Tobisch", "found": false}, {"type": "with", "string": "Zahlreiche Auszeichnungen", "found": false}, {"type": "with", "string": "Auch bei der j\u00fcngsten Wahl", "found": false}, {"type": "without", "string": "ORF2 zeigt in memoriam", "found": false}, {"type": "without", "string": "die Funktionalit\u00e4t dieser Website zu gew\u00e4hrleisten", "found": false}, {"type": "without", "string": "Aktuell in wien", "found": false}, {"type": "without", "string": "Viele Freunde, Verwandte und Fans haben sich", "found": false}, {"type": "without", "string": "Georg Hochmuth", "found": false}]}
{"file": "flvw.de-hallenmeisterschaften.html", "url": "https://www.flvw.de/news/detail/joana-herrmann-fliegt-bei-den-flvw-hallenmeisterschaften-ueber-178-meter/", "text_len": 3440, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Eine Woche nach seinem Titelgewinn", "found": true}, {"type": "with", "string": "Sekunden bedeutet f\u00fcr sie eine", "found": true}, {"type": "with", "string": "dreimal vergeblich an 1,80 Meter", "found": true}, {"type": "without", "string": "Themenrelevante Nachrichten", "found": false}, {"type": "without", "string": "Dreisprung auf 13,93 Meter", "found": false}, {"type": "without", "string": "im Kugelsto\u00dfen", "found": false}]}
{"file": "paginasiete.bo-carabineros.html", "url": "https://www.paginasiete.bo/seguridad/2022/5/3/policia-anuncia-coordinacion-con-carabineros-para-investigar-otros-casos-de-robo-de-vehiculos-330199.html", "text_len": 2875, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "coordinaci\u00f3n con Carabineros de Chile para", "found": true}, {"type": "with", "string": "Tribunal Supremo Disciplinario, teniente", "found": true}, {"type": "with", "string": "por el director nacional de Diprove\u201d.", "found": true}, {"type": "without", "string": "OTRAS NOTICIAS", "found": false}, {"type": "without", "string": "Investigan muerte de un", "found": false}, {"type": "without", "string": "SEGURIDAD", "found": false}]}
{"file": "cybercook.com.br.sequilho.html", "url": "https://cybercook.com.br/receitas/doces/biscoitos-doces/receita-de-sequilho-com-chocolate-amargo-124300", "text_len": 801, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Todos os ingredientes", "found": false}, {"type": "with", "string": "Composi\u00e7\u00e3o nutricional da receita", "found": false}, {"type": "with", "string": "Deixe secar em uma folha de papel", "found": true}, {"type": "without", "string": "Geladinho de Leite em P\u00f3 e", "found": false}, {"type": "without", "string": "Siga o CyberCook", "found": false}, {"type": "without", "string": "Conhe\u00e7a os iogurtes proteicos e inclua-os na sua alimenta\u00e7\u00e3o!", "found": false}]}
{"file": "Rosyjskie zamachy w Czechach - kontekst krajowy, implikacje, perspektywy.html", "url": "https://www.osw.waw.pl/pl/publikacje/analizy/2021-04-20/rosyjskie-zamachy-w-czechach-kontekst-krajowy-implikacje-perspektywy", "text_len": 11036, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "17 kwietnia na konferencji", "found": true}, {"type": "with", "string": "Informacja o nosz\u0105cym", "found": true}, {"type": "with", "string": "Media czeskie i brytyjskie", "found": true}, {"type": "without", "string": "DO WYS\u0141UCHANIA W SERWISIE", "found": false}, {"type": "without", "string": "Mateusz Seroka", "found": false}, {"type": "without", "string": "Publikacje", "found": false}]}
{"file": "bka.de-messengerdienste.html", "url": "https://www.bka.de/DE/Presse/Listenseite_Pressemitteilungen/2022/Presse2022/220126_PM_Telegram.html", "text_len": 1513, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "entwickelt sich nach Einsch\u00e4tzung der", "found": true}, {"type": "with", "string": "BKA gemeinsam mit den Landeskriminal\u00e4mtern", "found": true}, {"type": "with", "string": "Corona-Pandemie hat dazu beigetragen", "found": true}, {"type": "without", "string": "Pressemitteilung als PDF", "found": false}, {"type": "without", "string": "Haben Sie das Gesuchte nicht", "found": false}, {"type": "without", "string": "Neue Taskforce des Bundeskriminalamtes", "found": false}]}
{"file": "sonnenernergie.de.Windrebell.html", "url": "https://www.sonnenenergie.de//index.php?id=30&no_cache=1&tx_ttnews%5Btt_news%5D=477", "text_len": 20218, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "MIT KLEINWINDKRAFT ZU MEHR AUTARKIE:", "found": false}, {"type": "with", "string": "Ebenso wichtig wie die gro\u00dfr\u00e4umige", "found": true}, {"type": "with", "string": "Ob eine Kleinwindenergieanlage", "found": true}, {"type": "without", "string": "Von:", "found": false}, {"type": "without", "string": "Meist gesucht:", "found": false}, {"type": "without", "string": "Copyright 2018 - ", "found": false}]}
{"file": "beige.de.suedfrankreich.html", "url": "https://beige.de/artikel/reisen-travel-provence-suedfrankreich-tipps", "text_len": 6521, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Provence kann etwas,", "found": true}, {"type": "with", "string": "Als wir uns spontan entschieden,", "found": true}, {"type": "with", "string": "Dementsprechend haben wir", "found": true}, {"type": "without", "string": "Die Karte zum Abspeichern:", "found": false}, {"type": "without", "string": "Newsletter", "found": false}, {"type": "without", "string": "Datenschutz", "found": false}]}
{"file": "familie.de.montessori.html", "url": "https://www.familie.de/kleinkind/montessori-spielzeug-13-paedagogisch-wertvolle-ideen-fuer-babys-und-kleinkinder/", "text_len": 6696, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Es ist sch\u00f6n, bunt, unkaputtbar.", "found": true}, {"type": "with", "string": "Montessori Spielzeug f\u00f6rdert", "found": true}, {"type": "with", "string": "#3 Nanchen-Pupen", "found": true}, {"type": "without", "string": "Du willst nichts mehr verpassen?", "found": false}, {"type": "without", "string": "Lies auch", "found": false}, {"type": "without", "string": "Teste dich", "found": false}]}
{"file": "erp-news.info.interview.html", "url": "https://erp-news.info/erp-interview-mit-um-digitale-assistenten-und-kuenstliche-intelligenz-ki/", "text_len": 8724, "tp": 3, "fn": 0, "fp": 1, "tn": 3, "details": [{"type": "with", "string": "Einblicke in die Vision zuk\u00fcnftiger", "found": true}, {"type": "with", "string": "Frage 4: Welche Rolle spielt Big Data", "found": true}, {"type": "with", "string": "von The unbelievable Machine Company (*um)", "found": true}, {"type": "without", "string": "Matthias Weber ist ERP-Experte mit langj\u00e4hriger Berufserfahrung.", "found": false}, {"type": "without", "string": "Die Top 5 digitalen Trends f\u00fcr den Mittelstand", "found": false}, {"type": "without", "string": "leading edge", "found": true}, {"type": "without", "string": "Lesen Sie hier einen weiteren", "found": false}]}
{"file": "marktplatz.die-besserwisser.org.zeit.html", "url": "http://marktplatz.die-besserwisser.org/alles-hat-seine-zeit/", "text_len": 1147, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Sie war f\u00fcr uns spannend", "found": true}, {"type": "with", "string": "F\u00fcr einige der Mitglieder", "found": true}, {"type": "with", "string": "Begeisterung ist ansteckend", "found": true}, {"type": "without", "string": "Vorheriger Artikel", "found": false}, {"type": "without", "string": "Marktplatz f\u00fcr ein gutes Leben", "found": false}, {"type": "without", "string": "Leitfaden f\u00fcr den bio-regionalen Einkauf", "found": false}]}
{"file": "litradio.net.bossong.html", "url": "https://litradio.net/die-autorin-nora-bossong-im-gespraech-ueber-ihren-roman-schutzzone/", "text_len": 372, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Nora Bossong erz\u00e4hlt von der Arbeit", "found": true}, {"type": "with", "string": "ihre eigene Rolle als UN-Beauftragte", "found": true}, {"type": "with", "string": "Positionierung und Hoffnung in der Desillusion.", "found": true}, {"type": "without", "string": "LANGE NACHT JUNGER LITERATUR UND MUSIK", "found": false}, {"type": "without", "string": "Sharen mit:", "found": false}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}]}
{"file": "redtri.com.jokes.html", "url": "https://redtri.com/best-jokes-for-kids/slide/1", "text_len": 22837, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "37. What did one volcano say to the other?", "found": true}, {"type": "with", "string": " You look for fresh prints.", "found": false}, {"type": "with", "string": "Kids are natural comedians so why not encourage", "found": false}, {"type": "without", "string": "more stories you may have missed", "found": false}, {"type": "without", "string": "COMPANY INFO", "found": false}, {"type": "without", "string": "AS SEEN IN", "found": false}]}
{"file": "biathlon-antholz.it-jubeln.html", "url": "https://www.biathlon-antholz.it/de/newsroom/23-01-2022-dorothea-wierer-darf-beim-antholz-abschluss-noch-jubeln/17-378.html", "text_len": 5075, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "beim letzten Weltcuprennen schlug", "found": true}, {"type": "with", "string": "Biathlon-Tross pausiert jetzt knapp", "found": true}, {"type": "with", "string": "die trotz Corona, gut verlaufen", "found": true}, {"type": "without", "string": "ZUR\u00dcCK ZUR LISTE", "found": false}, {"type": "without", "string": "MIT FREUNDEN TEILEN", "found": false}, {"type": "without", "string": "DAS K\u00d6NNTE SIE AUCH", "found": false}]}
{"file": "villacc.de.galaxy.html", "url": "http://www.villacc.de/ferienvilla/119/Villa-Galaxy", "text_len": 14803, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In Cape Coral gibt", "found": false}, {"type": "with", "string": "Pool verwendet Salzelektrolyse", "found": false}, {"type": "with", "string": "Jede weitere Person: US $ 100,00", "found": true}, {"type": "without", "string": "oder berechnen Sie die Kosten", "found": false}, {"type": "without", "string": "+49 8670 986823", "found": false}, {"type": "without", "string": "LVCC ist Ihr Partner f\u00fcr die", "found": false}]}
{"file": "d60caba9d12c467b9708ec8981cad8aa.html", "url": "https://www.computerbild.de/artikel/cb-News-Freizeit-Bundesliga-Dortmund-Moenchengladbach-live-sehen-24356155.html", "text_len": 2700, "tp": 2, "fn": 2, "fp": 1, "tn": 3, "details": [{"type": "with", "string": "So sehen Sie das Spiel live", "found": false}, {"type": "with", "string": "dennoch ist die Gladbacher Verletztenliste weiterhin lang", "found": true}, {"type": "with", "string": "\u00bb Zum Angebot: Borussia Dortmund", "found": true}, {"type": "with", "string": "Tipp: Die Sport-App", "found": false}, {"type": "without", "string": "Kein Bild, kein Ton und trotzdem bestens informiert", "found": true}, {"type": "without", "string": " Sehen Sie die Highlights der europ\u00e4ischen Top-Ligen", "found": false}, {"type": "without", "string": "Gef\u00e4llt Ihnen dieser Artikel?", "found": false}, {"type": "without", "string": "Aktuelle Testberichte von Hard- und Software", "found": false}]}
{"file": "archiv.krimiblog.de.2895.html", "url": "http://archiv.krimiblog.de/?p=2895", "text_len": 961, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Okay, hat wieder nichts mit", "found": true}, {"type": "with", "string": "Erg\u00e4nzung 2: Glaubt man", "found": true}, {"type": "with", "string": "Erg\u00e4nzung 1: Den Text des Songs", "found": true}, {"type": "without", "string": "Leider sind keine Kommentare m\u00f6glich.", "found": false}, {"type": "without", "string": "Rasterfahndung", "found": false}, {"type": "without", "string": "Dies ist das Archiv von krimiblog.de", "found": false}]}
{"file": "0af99c85f22b451a93a75bbf99ac412e.html", "url": "https://www.mz-web.de/dessau-rosslau/hingucker-beim-flugplatzfest-zweite-f13-kurz-vor-der-zulassung-33328852", "text_len": 2939, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "entstanden ist er am Flughafen D\u00fcbendorf nahe Z\u00fcrich.", "found": true}, {"type": "with", "string": "Zugleich habe man das Fahrwerk verbessert.", "found": true}, {"type": "with", "string": "dann auch die vierte Maschine gebaut und zugelassen werden.", "found": true}, {"type": "without", "string": "MZ Dessau-Ro\u00dflau bei Facebook", "found": false}, {"type": "without", "string": "polinturner suchen Meister: Stelldichein der deutschen Hoffnungen in Dessau", "found": false}, {"type": "without", "string": "zu die einwandfreie Funktion der Webse", "found": false}]}
{"file": "Koncesjonowana opozycja -Leszek Ja\u017cd\u017cewski - Libert\u00e9!.html", "url": "https://liberte.pl/koncesjonowana-opozycja/", "text_len": 4991, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Pakt lewicy z PiS", "found": true}, {"type": "with", "string": "Podsumujmy. Lewica", "found": true}, {"type": "with", "string": "na salonach w\u0142adzy.", "found": true}, {"type": "without", "string": "Fundusz Odbudowy, lewica, PiS", "found": false}, {"type": "without", "string": "Inne artyku\u0142y autora", "found": false}, {"type": "without", "string": "Polityka prywatno\u015bci", "found": false}]}
{"file": "cducsu.de-wasserstoff.html", "url": "https://www.cducsu.de/themen/wirtschaft-und-energie-verkehr-bildung-und-forschung/gruener-wasserstoff-das-schluesselelement-der-energiewende", "text_len": 3751, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Mark Helfrich \u00fcber das gewaltige", "found": true}, {"type": "with", "string": "Aktuell befinden wir", "found": true}, {"type": "with", "string": "Deutschland einen erheblichen", "found": true}, {"type": "without", "string": "Biokerosin, Verpackungen", "found": true}, {"type": "without", "string": "Quelle: Foto Steven", "found": false}, {"type": "without", "string": "Transfer in die Praxis.", "found": true}]}
{"file": "silkes-weinkeller.de-dekantieren.html", "url": "https://www.silkes-weinkeller.de/weinblatt-magazin/wein-dekantieren/", "text_len": 5755, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "W\u00e4hrend die Trennung vom Depot", "found": true}, {"type": "with", "string": "Die meisten Gef\u00e4\u00dfe bestehen", "found": true}, {"type": "with", "string": " Potenzial, den Genuss", "found": true}, {"type": "without", "string": "Wein zum Spargel:", "found": false}, {"type": "without", "string": "Schreibe einen Kommentar", "found": false}, {"type": "without", "string": "Inhaltsverzeichnis", "found": true}]}
{"file": "oetv.at-taucher.html", "url": "https://www.oetv.at/news/artikel/d/erfolgreiches-masters-debuet-fuer-taucher-2.html", "text_len": 2021, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Rollstuhlclub ENJO Vorarlberg erneut", "found": false}, {"type": "with", "string": "Nachwuchssportler ging es dabei bereits einige Tage", "found": true}, {"type": "with", "string": "Im Match Tiebreak hatten die Engl\u00e4nder", "found": true}, {"type": "without", "string": "Top Themen der Redaktion", "found": false}, {"type": "without", "string": "Weltspitze der Junioren angekommen. (Foto: Privat)", "found": false}, {"type": "without", "string": "feierte indes in der vergangenen Woche internationale", "found": false}]}
{"file": "cooperativa.cl-presidente.html", "url": "https://www.cooperativa.cl/noticias/pais/presidente-boric/presidente-boric-vuelve-a-su-casa-magallanes-este-miercoles-realiza-su/2022-05-04/074527.html", "text_len": 2683, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Punta Arenas, con las autoridades", "found": true}, {"type": "with", "string": "territorio amigo\", al que represent\u00f3 durante dos", "found": true}, {"type": "with", "string": "Arenas, Boric se desplazar\u00e1 a Puerto", "found": true}, {"type": "without", "string": "Suscr\u00edbete a nuestro newsletter", "found": false}, {"type": "without", "string": "Este sitio est\u00e1 protegido por", "found": false}, {"type": "without", "string": "Foto: ATON", "found": false}]}
{"file": "Lebensmittelpraxis.de-Stadtzentrum.html", "url": "https://lebensmittelpraxis.de/handel-aktuell/38519-olympische-spiele-in-paris-getraenke-per-schiff-ins-stadtzentrum.html", "text_len": 1267, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Dazu werden die Getr\u00e4nke per Schiff", "found": true}, {"type": "with", "string": "von einem Lager im Umland zu einem Kai gegen\u00fcber dem Eiffelturm geliefert", "found": true}, {"type": "with", "string": "teilte die Pariser Hafengesellschaft mit", "found": true}, {"type": "without", "string": "Das k\u00f6nnte Sie auch interessieren", "found": false}, {"type": "without", "string": "Viel gelesen in Handel", "found": false}, {"type": "without", "string": "Supermarkt des Jahres 2023", "found": false}]}
{"file": "prof-pc.de.html", "url": "https://prof-pc.de/", "text_len": 1180, "tp": 3, "fn": 0, "fp": 0, "tn": 1, "details": [{"type": "with", "string": "Liebe_r Besucher_in", "found": true}, {"type": "with", "string": "Doch seitdem ist viel Zeit", "found": true}, {"type": "with", "string": "Thanks for All the Fish", "found": true}, {"type": "without", "string": "Datenschutzerkl\u00e4rung", "found": false}]}
{"file": "strangemachines.io.performant.html", "url": "https://strangemachines.io/articles/performant-python", "text_len": 5532, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "There are many ways to improve Python", "found": true}, {"type": "with", "string": "complicated, there are a number of ways ", "found": true}, {"type": "with", "string": "Map and filter are sometimes faster", "found": true}, {"type": "without", "string": "Challenges", "found": false}, {"type": "without", "string": "hello@strangemachines.io", "found": false}, {"type": "without", "string": "06 December 2019", "found": false}]}
{"file": "livenet.ch-sprache.html", "url": "https://www.livenet.ch/themen/gesellschaft/ethik/ethik/398805-von_sprachregeln_genderpolitik_und_ganz_normalem_deutsch.html", "text_len": 8094, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "dem Jakobsweg geschrieben!", "found": true}, {"type": "with", "string": "die Journalistin, ob es", "found": true}, {"type": "with", "string": "\u00fcber Gender-Politik finden", "found": true}, {"type": "without", "string": "The Edge wurde 60", "found": false}, {"type": "without", "string": "Dienstag 30.11.2021 in Baden", "found": false}, {"type": "without", "string": "von Livenet in der", "found": false}]}
{"file": "strive-magazin.de.dating.html", "url": "https://www.strive-magazine.de/post/das-dating-dilemma-erfolgreicher-frauen", "text_len": 5829, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Je erfolgreicher, kl\u00fcger, smarter", "found": true}, {"type": "with", "string": "Oha, steile These, Frau Praetorius!", "found": true}, {"type": "with", "string": "F\u00fcr jene, die damit ein ", "found": true}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}, {"type": "without", "string": "Kiosk finden", "found": false}, {"type": "without", "string": "Log In", "found": false}]}
{"file": "dawo-dresden.de-Winterausstellung.html", "url": "https://dawo-dresden.de/2023/10/30/drei-haselnuesse-fuer-aschenbroedel-jetzt-tickets-sichern-fuer-winterausstellung/", "text_len": 1709, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Genau 50 Jahre ist es her", "found": true}, {"type": "with", "string": "das der Film im Januar 1973 in Moritzburg", "found": true}, {"type": "with", "string": "in den Kulissen der Filmstudios Babelsberg", "found": true}, {"type": "without", "string": "Mehr Nachrichten aus Dresden", "found": false}, {"type": "without", "string": "Noch mehr lokale Fundst\u00fccke", "found": false}, {"type": "without", "string": "MEHR AUSFLUGSTIPPS", "found": false}]}
{"file": "auswaertiges-amt.de-Italien.html", "url": "https://www.auswaertiges-amt.de/de/ReiseUndSicherheit/italiensicherheit/211322", "text_len": 33840, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "kann weiterhin zu Einschr\u00e4nkungen", "found": false}, {"type": "with", "string": "Beachten Sie die ausf\u00fchrlichen", "found": true}, {"type": "with", "string": "Besonderheiten in den Regionen", "found": true}, {"type": "without", "string": "Schlagworte", "found": false}, {"type": "without", "string": "Reisewarnungen anl\u00e4sslich", "found": false}, {"type": "without", "string": "Gesellschaftsgruppen. Das Sendeformat", "found": false}]}
{"file": "ladiaria.com.uy-productor.html", "url": "https://ladiaria.com.uy/ambiente/articulo/2022/5/productor-fumigo-con-glifosato-predio-lindero-a-escuela-rural-ubicada-dentro-del-area-protegida-paso-centurion-y-sierra-de-rios/", "text_len": 11271, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "consideran \u201cexcesivo\u201d su tama\u00f1o.", "found": false}, {"type": "with", "string": " Ministerio de Ganader\u00eda, Agricultura y Pesca, autoridad", "found": true}, {"type": "with", "string": "en las zonas rurales lo que pasa muchas veces es que no", "found": true}, {"type": "without", "string": "Comentar este art\u00edculo", "found": false}, {"type": "without", "string": "La asociaci\u00f3n civil de rescate y", "found": false}, {"type": "without", "string": "Predio fumigado lindero a escuela dentro", "found": false}]}
{"file": "90min.de-Bundesliga-Tabelle.html", "url": "https://www.90min.de/posts/bundesliga-tabelle-2023-24-ohne-fehlentscheidungen-01hdgzyyg1b1", "text_len": 2389, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Mittlerweile vergeht kein Wochenende mehr", "found": true}, {"type": "with", "string": "an dem nicht \u00fcber den Schiedsrichter und/oder den VAR diskutiert wird", "found": true}, {"type": "with", "string": "Auch am 10. Spieltag der Bundesliga gab es gleich mehrere strittige Entscheidungen", "found": true}, {"type": "without", "string": "So s\u00e4he die Tabelle der Bundesliga", "found": false}, {"type": "without", "string": "2023/24 nach dem 14. Spieltag ohne Fehlentscheidungen aus", "found": false}, {"type": "without", "string": "Das Fu\u00dfball-Portal wahretabelle.de nimmt strittige", "found": true}]}
{"file": "bettycrocker.com.pineapple.html", "url": "https://www.bettycrocker.com/recipes/easy-pineapple-upside-down-cake/c4d3321d-fad9-41cb-8f29-8d91a4279b07", "text_len": 5917, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "pineapple slices in juice, drained, juice reserved", "found": false}, {"type": "with", "string": "Serve with sweetened whipped cream or an 8-oz", "found": false}, {"type": "with", "string": "warm or cool. Store covered in refrigerator.", "found": true}, {"type": "without", "string": "\u00a9 2020 \u00ae/TM General Mills All Rights Reserved", "found": false}, {"type": "without", "string": "Get kitchen tested recipes, meal ideas and more \u2013 straight to your inbox", "found": false}, {"type": "without", "string": "Most Recent Collections", "found": false}]}
{"file": "mydailymagazine.com.halloween.html", "url": "https://mydailymagazine.com/get-in-the-spooky-spirit-with-these-halloween-workouts/", "text_len": 1194, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Believe it or not, Halloween is just days", "found": true}, {"type": "with", "string": "Kelsey Ellis, is perfect for you. The workout", "found": true}, {"type": "with", "string": "12 reps of each exercise with one to", "found": true}, {"type": "without", "string": "Terms & Conditions", "found": false}, {"type": "without", "string": "Find Beauty in Imperfection with Public Holiday", "found": false}, {"type": "without", "string": "Hot Buttered Rum Cocktail All Season Long", "found": false}]}
{"file": "angelmagazin.de-schmerzen.html", "url": "https://angelmagazin.de/fische-schmerzen/", "text_len": 11271, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "anatomischen Voraussetzungen f\u00fcr ein Schmerzempfinden", "found": true}, {"type": "with", "string": "F\u00e4higkeiten, d. h. sie k\u00f6nnen Umweltinformationen", "found": true}, {"type": "with", "string": "Situation zum Bewusstsein beitragen.", "found": true}, {"type": "without", "string": "\u00dcber den Autor", "found": false}, {"type": "without", "string": "zus\u00e4tzlich noch einen Kaffee ", "found": false}, {"type": "without", "string": "Angeln in Magdeburg", "found": false}]}
{"file": "infosperber.ch-Madagaskar.html", "url": "https://www.infosperber.ch/politik/madagaskar-wo-francafrique-endet/", "text_len": 13396, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Der Insel Madagaskar wurde einst", "found": true}, {"type": "with", "string": "eine bl\u00fchende Zukunft vorausgesagt", "found": true}, {"type": "with", "string": "Nun droht das Land wegen Misswirtschaft und Korruption unterzugehen", "found": true}, {"type": "without", "string": "SEIT 10 TAGEN AM MEISTEN GELESEN", "found": false}, {"type": "without", "string": "AKTUELLE DOSSIERS", "found": false}, {"type": "without", "string": "SEIT 10 TAGEN AM MEISTEN REAKTIONEN", "found": false}]}
{"file": "ekhn.de-Pflegefinanzierung.html", "url": "https://www.ekhn.de/aktuell/detailmagazin/news/ekd-papier-fordert-reform-der-pflegefinanzierung.html", "text_len": 2419, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "soziale Ordnung anhand", "found": true}, {"type": "with", "string": "Bew\u00e4hrungstest des Sozialstaates", "found": true}, {"type": "with", "string": "besser bew\u00e4ltigt werden", "found": true}, {"type": "without", "string": "zu diesem Thema", "found": false}, {"type": "without", "string": "Pflege: Diakonie und", "found": false}, {"type": "without", "string": "Gewalt", "found": false}]}
{"file": "heizung.de.waermepumpen.html", "url": "https://www.heizung.de/waermepumpe/wissen/eignet-sich-eine-waermepumpe-im-altbau.html", "text_len": 8873, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "W\u00e4rmepumpenheizungen setzen", "found": true}, {"type": "with", "string": "W\u00e4rmepumpenanlagen gelten als", "found": true}, {"type": "with", "string": "Erreichen l\u00e4sst sich eine niedrige Vorlauftemperatur", "found": true}, {"type": "without", "string": "Mehr zu W\u00e4rmepumpe", "found": false}, {"type": "without", "string": "Neueste Artikel", "found": false}, {"type": "without", "string": "Heizung.de Top Themen", "found": false}]}
{"file": "laweekly.com-Cultivation.html", "url": "https://www.laweekly.com/meet-cultural-cultivation-artist-alexandria-douziech/", "text_len": 5289, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "I try to position plants as storytellers", "found": true}, {"type": "with", "string": "living archives that reflect the legacy of colonialism", "found": true}, {"type": "with", "string": "as well as the power of human resilience", "found": true}, {"type": "without", "string": "SUBSCRIBE TO OUR NEWSLETTER", "found": false}, {"type": "without", "string": "LATEST ARTICLES", "found": false}, {"type": "without", "string": "SEARCH LA WEEKLY", "found": false}]}
{"file": "computerbase.de.htc.html", "url": "https://www.computerbase.de/2007-06/htc-touch-bald-bei-o2-als-xda-nova/", "text_len": 2054, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Vor knapp zwei Wochen", "found": true}, {"type": "with", "string": "gibt es in der dazugeh\u00f6rigen Vorstellungs-News.", "found": true}, {"type": "without", "string": "Themen:", "found": false}, {"type": "without", "string": "bis Januar 2009 Artikel f\u00fcr ComputerBase verfasst.", "found": false}, {"type": "without", "string": "71 Kommentare", "found": false}]}
{"file": "creeny.wordpress.com.nebelsuppe.html", "url": "https://creeny.wordpress.com/2020/01/24/nebelsuppe-6/", "text_len": 644, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "1. Ich glaube, heute m\u00f6chte", "found": true}, {"type": "with", "string": "Gl\u00fccksmomente finden sich", "found": true}, {"type": "with", "string": "leckeren Flammkuchen, morgen", "found": true}, {"type": "without", "string": "Was ich liebe... \u2665", "found": false}, {"type": "without", "string": "Wortspuren hinterlassen", "found": false}, {"type": "without", "string": "\u2665 Gl\u00fccksmomente", "found": false}]}
{"file": "lavazza.de.qualita.html", "url": "https://www.lavazza.de/de/kaffee/gemahlener-kaffee/qualita-oro-250-g.html", "text_len": 333, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Qualit\u00e0 Oro war die erste Lavazza-Mischung", "found": false}, {"type": "with", "string": "Jede Mischung wird meisterhaft zusammengestellt", "found": true}, {"type": "with", "string": "Fruchtige und florale Noten", "found": false}, {"type": "without", "string": "Die Lieferung ist f\u00fcr Sie kostenlos", "found": false}, {"type": "without", "string": "Bitte teilen Sie uns Ihre Erfahrungen", "found": false}, {"type": "without", "string": "Heute empfehlen wir", "found": false}]}
{"file": "changenow.de.loibl.html", "url": "https://changenow.de/andre-loibl/", "text_len": 6823, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "1. Freude und Leichtigkeit.", "found": true}, {"type": "with", "string": "Ich habe ein kurzes Video gemacht", "found": true}, {"type": "with", "string": "offen und neugierig sind", "found": true}, {"type": "without", "string": "Weiter", "found": false}, {"type": "without", "string": "Hier kostenlos anmelden", "found": false}, {"type": "without", "string": "KANGA PROJECT", "found": false}]}
{"file": "die-tagespost.de.Demut.html", "url": "https://www.die-tagespost.de/leben/glauben-wissen/Warum-wir-jetzt-Demut-brauchen;art4886,207643", "text_len": 8918, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "sondern auch politische Ma\u00dfnahmen, wie die zur Bek\u00e4mpfung einer Pandemie", "found": false}, {"type": "with", "string": "In der Tat: Der moderne, s\u00e4kulare Mensch scheint weder Feigheit noch Schw\u00e4che zu kennen.", "found": true}, {"type": "with", "string": "nwirkungen unserer Ma\u00dfnahmen angesichts der SARS-CoV-2 Pandemie in den Blick zu nehmen", "found": true}, {"type": "without", "string": "Weitere Artikel", "found": false}, {"type": "without", "string": "Ihre Meinung zu diesem Thema", "found": false}, {"type": "without", "string": "Triage: Ein medizinethisches Dilemma", "found": false}]}
{"file": "archive.org.stol.it.berlusconi.html", "url": "https://web.archive.org/web/20120216182711/http://www.stol.it/Artikel/Politik-im-Ueberblick/Politik/Verfassungsgericht-Berlusconis-Sex-Prozess-geht-weiter", "text_len": 1780, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Das Verfassungsgericht in Rom verwarf am Dienstag einen Antrag", "found": true}, {"type": "with", "string": "Das Argument hatten die Mail\u00e4nder Staatsanw\u00e4lte \u201el\u00e4cherlich\u201c genannt.", "found": true}, {"type": "with", "string": "Das laufende Verfahren gegen den im November als", "found": true}, {"type": "without", "string": "IT 00853870210", "found": false}, {"type": "without", "string": "Hier k\u00f6nnen Sie den Artikel bewerten", "found": false}, {"type": "without", "string": "On-Tour Fotos", "found": false}]}
{"file": "independent.co.uk.penalty.html", "url": "https://www.independent.co.uk/news/uk/politics/coronavirus-false-reporting-contact-fine-penalty-b671230.html", "text_len": 4536, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Anyone falsely naming an antagonist as a coronavirus contact", "found": true}, {"type": "with", "string": "But it is understood that the ban on giving", "found": true}, {"type": "with", "string": "New fines for failure to self-isolate, starting", "found": true}, {"type": "without", "string": "Code of conduct and complaints", "found": false}, {"type": "without", "string": "Share your thoughts and debate the big issues", "found": false}, {"type": "without", "string": "Popular videos", "found": false}]}
{"file": "schimmverband.at-weltmeisterschaft.html", "url": "https://schwimmverband.at/news-artikel tx_news_pi1%5Baction%5D=detail&tx_news_pi1%5Bcontroller%5D=News&tx_news_pi1%5Bnews%5D=2236&cHash=892ac1491204c09aa3b2f080298e0218", "text_len": 2345, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wochen kolportiert wurde, ist", "found": false}, {"type": "with", "string": "verschoben werden m\u00fcssen.", "found": true}, {"type": "with", "string": "M\u00f6glichkeiten f\u00fcr Wettk\u00e4mpfe auf h\u00f6chstem", "found": true}, {"type": "without", "string": "Zur\u00fcck", "found": false}, {"type": "without", "string": "logo", "found": false}, {"type": "without", "string": "powered by", "found": false}]}
{"file": "banyuetan.org.1000200033136171577956287380194268_1.html", "url": "http://www.banyuetan.org/jmcs/detail/20200102/1000200033136171577956287380194268_1.html", "text_len": 1595, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u9ad8\u5ea6\u8ba4\u53ef\u2026\u2026", "found": true}, {"type": "with", "string": "\u53d1\u73b0\u793e\u4f1a", "found": true}, {"type": "with", "string": "\u59da\u52b2\u6ce2\u8bf4\u3002", "found": true}, {"type": "without", "string": "\u70ed\u95e8\u63a8\u8350", "found": false}, {"type": "without", "string": "\u7406\u8bba\u5e94\u8be5", "found": false}, {"type": "without", "string": "\u6742\u5fd7\u56fe\u4e66\u8ba2\u9605", "found": false}]}
{"file": "elcolumbiano.com-alcaldia.html", "url": "https://www.elcolombiano.com/antioquia/polemica-por-buses-de-la-alcaldia-en-casa-de-gustavo-petro-en-la-floresta-EN17385450", "text_len": 5696, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "encenderse esta semana, justo", "found": true}, {"type": "with", "string": "que el pasado 30 de abril los veh\u00edculos", "found": true}, {"type": "with", "string": "una de las cuotas de Quintero en el Pacto Hist\u00f3rico", "found": true}, {"type": "without", "string": "CONTEXTO DE LA NOTICIA", "found": false}, {"type": "without", "string": "ENLACES PATROCINADOS", "found": false}, {"type": "without", "string": "Porque entre varios ojos vemos m\u00e1s, queremos construir", "found": false}]}
{"file": "franceculture.fr.idees.html", "url": "https://www.franceculture.fr/emissions/le-journal-des-idees/le-journal-des-idees-emission-du-mardi-14-janvier-2020", "text_len": 6377, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Performativit\u00e9", "found": true}, {"type": "with", "string": "Les individus productifs communiquent", "found": true}, {"type": "with", "string": "de nos espoirs et de nos d\u00e9sirs.", "found": true}, {"type": "without", "string": "A la tribune je monterai", "found": false}, {"type": "without", "string": "\u00c0 d\u00e9couvrir", "found": false}, {"type": "without", "string": "Le fil culture", "found": false}]}
{"file": "jugend-forscht.de-Feuerl\u00f6schtechnik.html", "url": "https://www.jugend-forscht.de/presse/pressemitteilungen/archiv/neuartige-feuerloeschtechnik-alternative-grillkohle-und-redox-flow-technologie-mint-talente-praesentieren-innovative-ideen.html", "text_len": 3697, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Preistr\u00e4ger von Deutschlands bekanntestem", "found": true}, {"type": "with", "string": "Kern-Brennstoff\u201c ist eine", "found": true}, {"type": "with", "string": "Gesch\u00e4ftsf\u00fchrender Vorstand", "found": true}, {"type": "without", "string": "Folge uns", "found": false}, {"type": "without", "string": "Video: Mehrwert eines Jugend", "found": false}, {"type": "without", "string": "Projektdatenbank", "found": false}]}
{"file": "pocketpc.ch.auslieferung.html", "url": "https://www.pocketpc.ch/windows-phone-7-allgemein/122760-microsoft-beginnt-auslieferung-vorbereitungsupdate-34.html", "text_len": 4141, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "as war noch nicht das Update, sondern nur", "found": true}, {"type": "with", "string": "s auf Ger\u00e4t, Telefon oder Ha", "found": false}, {"type": "with", "string": "hat keine 5 Minuten gedauert, warum denn bei einigen", "found": true}, {"type": "without", "string": "Gewinnspiel: Das neue Quizdue", "found": false}, {"type": "without", "string": "[Apple Pay] und eure Erfahrun", "found": false}, {"type": "without", "string": "Review: InLine BT-POCKET falt", "found": false}]}
{"file": "popsugar.co.uk.halloween.html", "url": "https://www.popsugar.co.uk/smart-living/Cheap-Homemade-Halloween-Costumes-42432483/amp", "text_len": 32968, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "thanks to these genius ideas. This year", "found": true}, {"type": "with", "string": "With a bowler hat, a set of false lashes", "found": true}, {"type": "with", "string": "Long hair or not, you can still pull", "found": true}, {"type": "without", "string": "Send You Push Notifications.", "found": false}, {"type": "without", "string": "POPSUGAR Would Like To ", "found": false}, {"type": "without", "string": "Want More?", "found": false}]}
{"file": "tegernseerstimme.de-Klimavorreiter.html", "url": "https://tegernseerstimme.de/klimavorreiter-oberland-energie-effizienz-netzwerktreffen-in-egling/", "text_len": 3521, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Vertreter der Gemeinden und Fachleute diskutierten", "found": true}, {"type": "with", "string": "auch \u00fcber die sogenannte energieeffiziente", "found": true}, {"type": "with", "string": "welche in Neubaugebieten gut genutzt werden kann", "found": true}, {"type": "without", "string": "Autounfall in St. QuirinAutounfall in St. Quirin", "found": false}, {"type": "without", "string": "MVV-Beitritt bringt Touristen auf die Schienen", "found": false}, {"type": "without", "string": "Diskutieren Sie mit uns", "found": false}]}
{"file": "dvgw.de.heizug.html", "url": "https://www.dvgw.de/blog/gas/welche-heizung-ist-klimafreundlich-und-zukunftstauglich", "text_len": 13049, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In den Heizungen unserer", "found": true}, {"type": "with", "string": "Von den verschiedenen Heizsystemen im Haus", "found": true}, {"type": "with", "string": "Dazu kommt, dass nicht jedes Geb\u00e4ude f\u00fcr", "found": true}, {"type": "without", "string": "Weitere Informationen", "found": false}, {"type": "without", "string": "Ansprechpartner", "found": false}, {"type": "without", "string": "Bleiben Sie auf dem Laufenden", "found": false}]}
{"file": "mitternachtskabinett.wordpress.com.gentrifizierung.html", "url": "https://mitternachtskabinett.wordpress.com/2016/06/19/geister-spuk-gentrifizierung/", "text_len": 1021, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Unser heutiger Gast berichtet von", "found": true}, {"type": "with", "string": "Wie wirkt sich die Gentrifizierung", "found": true}, {"type": "with", "string": "Als Monster der Woche besprechen", "found": true}, {"type": "without", "string": "Gib deine E-Mail-Adresse ein", "found": false}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}, {"type": "without", "string": "Kommentar verfassen", "found": false}]}
{"file": "trails.de.ischgl.html", "url": "https://trails.de/mountainbikeregion/ischgl/", "text_len": 6239, "tp": 3, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Ischgl hat sich im Sommer vor allem als Freeride Revier", "found": true}, {"type": "with", "string": "Wer MTB am liebsten bergab betreibt ist in Ischgl in seinem Element", "found": true}, {"type": "with", "string": "hei\u00dfer Tipp f\u00fcr die warmen Monate", "found": true}, {"type": "without", "string": "Bike Hotels", "found": false}, {"type": "without", "string": "Webdesign und alle Inhalte", "found": false}]}
{"file": "bmel.de-zukunftsforum.html", "url": "https://www.bmel.de/DE/themen/laendliche-regionen/zukunftsforum2022.html;jsessionid=ED5DD5866BE5A5FAA71D389A9C6A5802.live922", "text_len": 1239, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "B\u00fcrgerschaftliches Engagement und Ehrenamt", "found": true}, {"type": "with", "string": "Zwei Tage wurde dar\u00fcber diskutiert,", "found": true}, {"type": "with", "string": "Ehrenamtliche in l\u00e4ndlichen Regionen.", "found": true}, {"type": "without", "string": "Gestalten, anstatt zu spalten: Ehrenamtliche", "found": false}, {"type": "without", "string": "Kommission Gleichwertige", "found": false}, {"type": "without", "string": "R\u00fcckblick: Das 14. Zukunftsforum L\u00e4ndliche", "found": false}]}
{"file": "cdu-fraktion-erfurt.de.waldorfschule.html", "url": "http://www.cdu-fraktion-erfurt.de/inhalte/aktuelles/entwicklung-der-waldorfschule-ermoeglicht/index.html", "text_len": 1849, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Ein positives Signal gab", "found": true}, {"type": "with", "string": "der steigenden Nachfrage gerecht zu werden.", "found": true}, {"type": "without", "string": "Zur\u00fcck zur \u00dcbersicht", "found": false}, {"type": "without", "string": "Erh\u00f6hung f\u00fcr Zoo-Eintritt", "found": false}]}
{"file": "blog.gaijinpot.com.chikan.html", "url": "https://blog.gaijinpot.com/tweet-of-the-week-67-dealing-with-chikan/", "text_len": 7515, "tp": 4, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "fear of causing a fuss in public", "found": true}, {"type": "with", "string": "\u78ba\u4fdd\u3059\u308b\u3002", "found": true}, {"type": "with", "string": "help apprehend the culprit.", "found": true}, {"type": "with", "string": "@keizi666", "found": true}, {"type": "without", "string": "Vegan food is notoriously hard", "found": false}, {"type": "without", "string": " 5 min read", "found": false}, {"type": "without", "string": "Student Placement Service", "found": false}]}
{"file": "0a4a8ab61c054192b1ec70cc3570cf45.html", "url": "https://www.zugreiseblog.de/db-lounge-zutritt-sparpreis/", "text_len": 4671, "tp": 3, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "Die Deutsche Bahn streicht den Zutritt zu ihrer DB Lounge", "found": true}, {"type": "with", "string": "Die Deutsche Bahn \u00e4ndert zum Fahrplanwechsel", "found": true}, {"type": "with", "string": "Neues gastronomisches Konzept", "found": true}, {"type": "without", "string": "Das k\u00f6nnte Dich auch interessieren", "found": false}, {"type": "without", "string": "Sder Gr\u00fcnder des Zugreiseblog", "found": false}, {"type": "without", "string": "Erfahre zudem,", "found": false}, {"type": "without", "string": "Mit meinem kostenlosen Newsletter verpasst", "found": false}]}
{"file": "bdzv.de.eliasson.html", "url": "https://www.bdzv.de/nachrichten-und-service/presse/pressemitteilungen/artikel/detail/olafur-eliasson-gestaltet-titelseite-fuer-die-deutschen-zeitungen/", "text_len": 2724, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "esichts der Corona-Krise und ihrer Folgen f\u00fcr die Gesellschaft ist das Thema ", "found": true}, {"type": "with", "string": "effpunkt von Journalist, Text und Leser fokussiert. Das Werk entstan", "found": true}, {"type": "with", "string": "rall auf der Welt das Recht haben muss, frei und ohne Angst berichten zu k\u00f6nnen.", "found": true}, {"type": "without", "string": "zur\u00fcck", "found": false}, {"type": "without", "string": "nach oben", "found": false}, {"type": "without", "string": "English", "found": false}]}
{"file": "petri-heil-ch-hechte.html", "url": "https://www.petri-heil.ch/de/bielerseewinterhechte--1026", "text_len": 6648, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "untersch\u00e4tzter Zielfisch in der Schweiz", "found": true}, {"type": "with", "string": "kalten Jahreszeit im Revier", "found": true}, {"type": "with", "string": "kr\u00e4ftezehrend hochgedrillt werden", "found": true}, {"type": "without", "string": "Keine Kommentare", "found": true}, {"type": "without", "string": "Faszination Bass", "found": false}, {"type": "without", "string": "Unterwasser Angriff", "found": false}]}
{"file": "de.starsinsider.com-Angst.html", "url": "https://de.starsinsider.com/gesundheit/588409/this-is-what-happens-to-your-brain-and-body-when-you-get-scared", "text_len": 6454, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Angst ist ein unausweichlicher Bestandteil", "found": true}, {"type": "with", "string": "der menschlichen Erfahrung", "found": true}, {"type": "with", "string": "Obwohl sie in der Regel als eine unerw\u00fcnschte Emotion", "found": true}, {"type": "without", "string": "MEIST GELESEN", "found": false}, {"type": "without", "string": "F\u00dcR DICH EMPFOHLEN", "found": false}, {"type": "without", "string": "Wie gef\u00e4hrlich ist Scharlach?", "found": false}]}
{"file": "landwirt.com.sensortechnik.html", "url": "https://www.landwirt.com/Precision-Farming-Moderne-Sensortechnik-im-Kuhstall,,4229,,Bericht.html", "text_len": 4027, "tp": 3, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "b) \u00dcberwachung der somatischen Zellen", "found": true}, {"type": "with", "string": "Wiederkauverhalten und Kotkonsistenz.", "found": true}, {"type": "with", "string": "K\u00f6llitsch (D)", "found": true}, {"type": "without", "string": "Anzeigentarife", "found": false}, {"type": "without", "string": "weiterempfehlen", "found": false}, {"type": "without", "string": "New Holland T6050", "found": false}, {"type": "without", "string": "Aktuelle Berichte aus dieser Kategorie", "found": false}]}
{"file": "ekbo.de-Bischofs.html", "url": "https://www.ekbo.de/themen/detail/nachricht/bischofswort.html", "text_len": 3303, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "zur Er\u00f6ffnung der Schlo\u00dfkirche", "found": true}, {"type": "with", "string": "Bei der Erweiterung", "found": true}, {"type": "with", "string": "\u201eWir sind Kirche mit Gefl\u00fcchteten", "found": true}, {"type": "without", "string": "\u00c4hnliche Nachrichten", "found": false}, {"type": "without", "string": "Livestream der Synode", "found": false}, {"type": "without", "string": "Wort des Bischofs zur Herbstsynode", "found": false}]}
{"file": "golf.de-augusta.html", "url": "https://www.golf.de/i7484_1.html", "text_len": 9903, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Weg dorthin war f\u00fcr den in Dallas geborenen", "found": true}, {"type": "with", "string": "Blickt man auf Elders Werdegang", "found": true}, {"type": "with", "string": "Zocker und Wettliebhaber arbeitete", "found": true}, {"type": "without", "string": "Nicklaus \u2013 Mann der gro\u00dfen Worte", "found": false}, {"type": "without", "string": "Mehr zum Thema", "found": false}, {"type": "without", "string": "Augusta National/Getty Images", "found": false}]}
{"file": "bloghaus.hypotheses.org.2320.html", "url": "https://bloghaus.hypotheses.org/2320", "text_len": 1620, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Um Sichtbarkeit und Leserschaft", "found": true}, {"type": "with", "string": "In diesem Blogbeitrag zeigen wir", "found": true}, {"type": "with", "string": "Und so sieht das bei uns im Redaktionsblog aus", "found": true}, {"type": "without", "string": "Ein Blog pr\u00e4sentiert von Hypotheses", "found": false}, {"type": "without", "string": "Dieses Blog gibt Hilfestellung", "found": false}, {"type": "without", "string": "Bloghaus in anderen Sprachen", "found": false}]}
{"file": "tdg.ch.chlorothalonil.html", "url": "https://www.tdg.ch/suisse/berne-interdit-chlorothalonil/story/18348200", "text_len": 5251, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Le chlorothalonil sera interdit", "found": true}, {"type": "with", "string": "Le chlorothalonil est une substance active utilis\u00e9e", "found": true}, {"type": "with", "string": "Les Suisses pourraient \u00e9galement se prononcer sur", "found": true}, {"type": "without", "string": "Avez-vous appr\u00e9ci\u00e9 cet article?", "found": false}, {"type": "without", "string": "Plus de sujets", "found": false}, {"type": "without", "string": "Le canton de Berne veut interdire le chlorothalonil ", "found": false}]}
{"file": "focus.de.leasen.html", "url": "https://www.focus.de/auto/experten/auto-leasen-oder-kaufen-fuer-wen-lohnt-sich-was_id_9209161.html", "text_len": 6494, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "FOCUS-Online-Experte Robin Tsch\u00f6pe hat sie verglichen.", "found": true}, {"type": "with", "string": "Mit einem Schlag ist d", "found": true}, {"type": "with", "string": "Wer es gerne flexibel mag", "found": true}, {"type": "without", "string": "Bitte loggen Sie sich vor dem Kommentieren ein", "found": false}, {"type": "without", "string": "\u201eExperten\u201c abonnieren", "found": false}, {"type": "without", "string": "Pers\u00f6nlicher Newsletter", "found": false}]}
{"file": "Ile jest warta godzina pracy_ W tych krajach praca pop\u0142aca - Forsal.pl.html", "url": "https://forsal.pl/gospodarka/pkb/artykuly/8150873,ile-jest-warta-godzina-pracy.html", "text_len": 995, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Portal Statista powo\u0142uje", "found": true}, {"type": "with", "string": "54,4 dolara.", "found": true}, {"type": "with", "string": "Oto kraje, w", "found": true}, {"type": "without", "string": "ShutterStock", "found": false}, {"type": "without", "string": "Ten tekst przeczytasz", "found": true}, {"type": "without", "string": "\u0179r\u00f3d\u0142o:", "found": false}]}
{"file": "alacarte.at-purzelbaum.html", "url": "https://www.alacarte.at/reisen/der-historische-purzelbaum-20215/", "text_len": 20403, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Leipzig war, widerfuhr mir etwas Merkw\u00fcrdiges", "found": true}, {"type": "with", "string": "Menschen umfassende Saal bis auf", "found": true}, {"type": "with", "string": "anderswo kennengelernt hatte, und", "found": true}, {"type": "without", "string": "Milchbar Pinguin", "found": true}, {"type": "without", "string": "In Auerbachs Keller tafelten Faust und Mephisto", "found": false}, {"type": "without", "string": "SHARE", "found": false}]}
{"file": "bmjv.de.konsum.html", "url": "https://www.bmjv.de/DE/Verbraucherportal/KonsumImAlltag/TransparenzPreisanpassung/TransparenzPreisanpassung_node.html", "text_len": 12668, "tp": 3, "fn": 0, "fp": 1, "tn": 3, "details": [{"type": "with", "string": "Auch hier gilt der Grundsatz,", "found": true}, {"type": "with", "string": "Anbieter von Fernw\u00e4rme haben innerhalb ihres Leitungsnetzes ein Monopol", "found": true}, {"type": "with", "string": "(Billigkeitskontrolle nach \u00a7 315 BGB)", "found": true}, {"type": "without", "string": "Impressum", "found": false}, {"type": "without", "string": "Weitere Informationen", "found": false}, {"type": "without", "string": "Transparenz bei Preisanpassungen", "found": true}, {"type": "without", "string": "Twitter", "found": false}]}
{"file": "backenmachtgluecklich.de.zitronenkuchen.html", "url": "https://www.backenmachtgluecklich.de/rezepte/saftiger-zitronenkuchen-vom-blech.html", "text_len": 5049, "tp": 6, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "einen echten Klassiker aus der Backstube.", "found": true}, {"type": "with", "string": "Sobald der Kuchen gebacken", "found": true}, {"type": "with", "string": "Diesen Beitrag habe ich 2017", "found": true}, {"type": "with", "string": "6 mittelgro\u00dfe Eier", "found": true}, {"type": "with", "string": "R\u00fchrteig auf dem Blech verteilen", "found": true}, {"type": "with", "string": "Du m\u00f6chtest Zutaten ersetzen?", "found": true}, {"type": "without", "string": "Pinnen", "found": false}, {"type": "without", "string": "Rezept drucken", "found": false}, {"type": "without", "string": "Zudem erh\u00e4ltst du jede Woche", "found": false}, {"type": "without", "string": "Hallo, ich bin Foodbloggerin", "found": false}]}
{"file": "legrandcontinent.eu.heran.html", "url": "https://legrandcontinent.eu/fr/2020/03/02/francois-heran/", "text_len": 10955, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "certes beaucoup de migrants, mais c\u2019est un flux massif continu.", "found": true}, {"type": "with", "string": "il faut avoir d\u00e9j\u00e0 les ressources, savoir d\u00e9j\u00e0", "found": true}, {"type": "with", "string": "la justice spatiale est un des objectifs de l\u2019Union, alors Dublin n\u2019est pas acceptable", "found": true}, {"type": "without", "string": "Pour approfondir", "found": false}, {"type": "without", "string": "concepts li\u00e9s \u00e0 l", "found": false}, {"type": "without", "string": "Coronavirus, un t\u00e9moignage du front", "found": false}]}
{"file": "haus.de-Vorsatzschallung.html", "url": "https://www.haus.de/bauen/vorsatzschalung-33656", "text_len": 6083, "tp": 2, "fn": 1, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "vor allem in der Trockenbauweise", "found": false}, {"type": "with", "string": "Zwischen den beiden Elementen", "found": true}, {"type": "with", "string": "Schallschutz sorgen. Bei der direkt befestigten", "found": true}, {"type": "without", "string": "H\u00c4UFIG GESTELLTE FRAGEN", "found": false}, {"type": "without", "string": "Wirkt eine Vorsatzschalung als Dampfbremse?", "found": false}, {"type": "without", "string": "Schallschutz sowie die W\u00e4rmeisolierung.", "found": true}]}
{"file": "eurosport.de-corona.html", "url": "https://www.eurosport.de/olympia/olympia-2022-in-peking/2022/olympia-2022-zweiter-coronafall-deutschen-team-aufregung-thomas-weikert-vorganger-attackiert_sto8749554/story.shtml", "text_len": 3573, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Alfons H\u00f6rmann seinen Nachfolger Thomas", "found": false}, {"type": "with", "string": "die Defensive. Kurz vor der Er\u00f6ffnungsfeier", "found": true}, {"type": "with", "string": "Athlet oder Betreuer, sitzt symptomfrei mit einem", "found": true}, {"type": "without", "string": "LETZTE NEWS", "found": false}, {"type": "without", "string": "DOLL \"BEIM ERSTEN MAL LOCKERER\"", "found": false}, {"type": "without", "string": "N\u00c4CHSTES DEUTSCHES TEAMMITGLIED", "found": false}]}
{"file": "handball-word.news-nationalspiel.html", "url": "https://www.handball-world.news/o.red.r/news-1-1-1-139353.html", "text_len": 3885, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Jahre zum Handball Sport", "found": false}, {"type": "with", "string": "Lippe und die SG Flensburg-Handewitt", "found": false}, {"type": "with", "string": "Erinnerungen an Hamburg", "found": false}, {"type": "without", "string": "Eine Tasse davon", "found": false}, {"type": "without", "string": "nimmt...", "found": false}, {"type": "without", "string": "\"Waren vier", "found": false}]}
{"file": "thenervousbreakdown.com.loneliest.html", "url": "http://thenervousbreakdown.com/tanderson/2011/07/the-loneliest-woman-in-the-world-an-appreciation-of-hearts-alone/", "text_len": 5762, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Fans of Heart, the rawk band", "found": true}, {"type": "with", "string": "I stayed, because Ann was really about to deliver", "found": true}, {"type": "with", "string": "And of course they did get through it.", "found": true}, {"type": "without", "string": "Leave a Reply", "found": false}, {"type": "without", "string": "responses to \u201cThe Loneliest Woman in", "found": false}, {"type": "without", "string": "TIM ANDERSON has done many amazing things in his short life.", "found": false}]}
{"file": "sibenlab.blogspot.com.privacy.html", "url": "http://sibenlab.blogspot.com/2018/06/sibenlab-privacy-policy.html", "text_len": 10337, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "This privacy policy has been compiled to", "found": true}, {"type": "with", "string": "If at any time you would like to", "found": true}, {"type": "with", "string": "visiting the Google Ad and Content Network privacy", "found": true}, {"type": "without", "string": "Th\u00e8me Simple. Fourni par", "found": false}, {"type": "without", "string": "Inscription \u00e0", "found": false}, {"type": "without", "string": "Publier un commentaire", "found": false}]}
{"file": "japantimes.co.jp.surgical.html", "url": "https://www.japantimes.co.jp/news/2020/02/18/national/crime-legal/6000-surgical-masks-stolen/", "text_len": 870, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "The incident has occurred at a time when Japan is seeing a shortage of face masks", "found": true}, {"type": "with", "string": "Four of the 12 boxes of masks were gone", "found": true}, {"type": "with", "string": "KOBE \u2013 A total of 6,000 surgical masks", "found": true}, {"type": "without", "string": "Do masks offer protection from new coronavirus? It depends", "found": false}, {"type": "without", "string": "Mail the editor", "found": false}, {"type": "without", "string": "RELATED STORIES", "found": false}]}
{"file": "caritas.de-Pr\u00e4sidentin.html", "url": "https://www.caritas.de/presse/pressemeldungen-dcv/eva-welskop-deffaa-zur-neuen-caritas-praesidentin-gewaehlt-7fc83ad4-6508-4c79-adba-8a0fee82a677", "text_len": 1795, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Digitale Agenda des Verbande", "found": true}, {"type": "with", "string": "\u201eDie T\u00fcren der Kirche von innen aufsto\u00dfen\u201c", "found": true}, {"type": "with", "string": "18 Jahren als Caritas-Pr\u00e4sident", "found": true}, {"type": "without", "string": "Pressesprecherin des", "found": false}, {"type": "without", "string": "Berliner B\u00fcro \u2013 Pressestelle", "found": false}, {"type": "without", "string": "DCV / Oppitz", "found": false}]}
{"file": "kirche-und-leben.de-M\u00fcnster.html", "url": "https://www.kirche-und-leben.de/artikel/muensters-caritas-chef-kessmann-ist-gegen-impfpflicht-in-der-pflege", "text_len": 2730, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Impfpflicht f\u00fcr die Pflege", "found": false}, {"type": "with", "string": "Impfquoten mit zwischen", "found": true}, {"type": "with", "string": "komme es trotz hohen", "found": true}, {"type": "without", "string": "Die Ignoranz der", "found": false}, {"type": "without", "string": "k\u00f6nnen entscheiden", "found": false}, {"type": "without", "string": "auf Corona-Tests vor", "found": false}]}
{"file": "www.dhb.de-regionallehrgang.html", "url": "https://www.dhb.de/de/redaktionsbaum/nationalteams/a-frauen/erneuter-verzicht-auf-regionallehrgang-/", "text_len": 748, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "im M\u00e4rz beginnen. Teil der Ma\u00dfnahme", "found": true}, {"type": "with", "string": "HBF und Liga k\u00f6nnen die freigewordenen", "found": true}, {"type": "with", "string": "Nationalmannschaft im M\u00e4rz mit", "found": false}, {"type": "without", "string": "NEWS", "found": false}, {"type": "without", "string": "Foto: Sascha Klahn", "found": false}, {"type": "without", "string": "A-FRAUEN", "found": false}]}
{"file": "oekologisch-bauen.info.energieeffizienz.html", "url": "https://www.oekologisch-bauen.info/haustechnik/elektro-fotovoltaik/initiative-energieeffizienz/", "text_len": 2169, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Mit der Initiative EnergieEffizienz", "found": true}, {"type": "with", "string": "Der Stromcheck", "found": true}, {"type": "with", "string": "Weitere Informationen rund um das Thema", "found": true}, {"type": "without", "string": "RATGEBER FIRMEN NEWS FORUM", "found": false}, {"type": "without", "string": "KURZ NOTIERT", "found": false}, {"type": "without", "string": "Impressum", "found": false}]}
{"file": "zulang.wordpress.com.genitalverstuemmelung.html", "url": "https://zulang.wordpress.com/2015/12/12/3-jahre-legalisierte-genitalverstuemmelung/", "text_len": 8672, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Einen ausf\u00fchrlichen Einstieg", "found": true}, {"type": "with", "string": "Bef\u00fcrworter der Beschneidung bagatellisieren", "found": true}, {"type": "with", "string": "Dem l\u00e4sst sich kaum etwas hinzuf\u00fcgen", "found": true}, {"type": "without", "string": "Die Kommentarfunktion ist geschlossen", "found": false}, {"type": "without", "string": "Share this:", "found": false}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}]}
{"file": "zoll.de-Tabaksteuer.html", "url": "https://www.zoll.de/SharedDocs/Fachmeldungen/Aktuelle-Einzelmeldungen/2021/vst_verkuendung_tabaksteuermodernisierungsgesetz.html", "text_len": 1759, "tp": 3, "fn": 0, "fp": 2, "tn": 2, "details": [{"type": "with", "string": "f\u00fcr Substitute f\u00fcr Tabakwaren.", "found": true}, {"type": "with", "string": "1. Januar 2023", "found": true}, {"type": "with", "string": "Beteiligte, die erstmals", "found": true}, {"type": "without", "string": "(Fachthemen)", "found": true}, {"type": "without", "string": "Wie gef\u00e4llt Ihnen unsere", "found": false}, {"type": "without", "string": "Weitere Informationen", "found": false}, {"type": "without", "string": "PDF", "found": true}]}
{"file": "netzpolitik.org.abmahnungen.html", "url": "https://netzpolitik.org/2016/die-cider-connection-abmahnungen-gegen-nutzer-von-creative-commons-bildern/", "text_len": 12357, "tp": 3, "fn": 1, "fp": 0, "tn": 5, "details": [{"type": "with", "string": "Seit Dezember 2015", "found": false}, {"type": "with", "string": "VSGE", "found": true}, {"type": "with", "string": "Dazu muss das \u00fcberholte Urheberrecht", "found": true}, {"type": "with", "string": "Dieser Artikel baut auf einer gemeinsamen Recherche", "found": true}, {"type": "without", "string": "23.06.2016", "found": false}, {"type": "without", "string": "Zum Vergr\u00f6\u00dfern auf das Bild", "found": false}, {"type": "without", "string": "Markus Reuter besch\u00e4ftigt sich", "found": false}, {"type": "without", "string": "Ist Video\u00fcberwachung beim Zahnarzt", "found": false}, {"type": "without", "string": "Wir sind spendenfinanziert.", "found": false}]}
{"file": "d44c5ef50718437984dca47627dee96b.html", "url": "https://appen.com/blog/artificial-intelligence-and-machine-learning-industry-news-ai-in-patient-care-and-operations-ai-as-a-preventive-tool-and-how-major-hospitals-are-already-using-ai/", "text_len": 5885, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Follow us to stay up to date on industry trends.", "found": true}, {"type": "with", "string": "How Major Hospitals are Already Using AI", "found": true}, {"type": "with", "string": "With predictive analytics,", "found": true}, {"type": "without", "string": "Trending Posts", "found": false}, {"type": "without", "string": "Subscribe to email updates", "found": false}, {"type": "without", "string": "Receive our monthly newsletter", "found": false}]}
{"file": "dailymail.co.uk.food.html", "url": "https://www.dailymail.co.uk/news/article-8772683/Chef-Jamie-Oliver-joins-Mail-Sundays-war-toxic-food.html", "text_len": 36696, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "A powerful alliance of chefs, celebrities and charities", "found": true}, {"type": "with", "string": " would also help secure the goal set out so", "found": true}, {"type": "with", "string": "Even George Eustice, the current Environment Secretary", "found": true}, {"type": "without", "string": "As many as a million young people", "found": false}, {"type": "without", "string": "The letter also argues that 'the British public", "found": true}, {"type": "without", "string": "As things stand the Government is telling Tory MP", "found": true}]}
{"file": "berkutschi.com-willingen.html", "url": "https://berkutschi.com/de/front/news/10759-marius-lindvik-gewinnt-in-willingen", "text_len": 2456, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "und dem Slowenen Cene Prevc durch", "found": true}, {"type": "with", "string": "zu den Top-Favoriten auf Olympisches", "found": true}, {"type": "with", "string": "Olympischen Spiele am", "found": true}, {"type": "without", "string": "Wettkampfdaten", "found": false}, {"type": "without", "string": "Weltcup Herren", "found": false}, {"type": "without", "string": "Weitester Sprung", "found": false}]}
{"file": "unzensuriert.at-Zeche.html", "url": "https://unzensuriert.at/209302-von-der-leyen-will-kriegsland-ukraine-in-eu-holen-oesterreich-zahlt-die-zeche/", "text_len": 2459, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Aussage von EU-Kommissionspr\u00e4sidentin Ursula von der Leyen", "found": true}, {"type": "with", "string": "dass die Ukraine den Weg f\u00fcr Beitrittsgespr\u00e4che fast geschafft h\u00e4tte", "found": true}, {"type": "with", "string": "l\u00e4sst bei FP\u00d6-Europasprecherin Petra Steger die Alarmglocken l\u00e4uten.", "found": true}, {"type": "without", "string": "Alle Politik-Artikel lesen", "found": false}, {"type": "without", "string": "Bidens Bruder teilt trotz Freundin...", "found": false}, {"type": "without", "string": "Wenn Sie dieses Youtube-Video sehen m\u00f6chten, m\u00fcssen Sie die externen YouTube-cookies akzeptieren.", "found": false}]}
{"file": "chip.de.beef.html", "url": "https://www.chip.de/test/Beef-Maker-von-Aldi-im-Test_154632771.html", "text_len": 7071, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Starke Hitze nur in der Mitte", "found": true}, {"type": "with", "string": "ca. 35,7\u00d729,4 cm", "found": true}, {"type": "with", "string": "Wir sind im Steak-Himmel!", "found": true}, {"type": "without", "string": "Samsung Galaxy S10 128GB", "found": false}, {"type": "without", "string": "F\u00fcr Links auf dieser Seite", "found": false}, {"type": "without", "string": "Inga Buller ist Head of Social", "found": true}]}
{"file": "chorknaben-ulm.de.geschichte.html", "url": "https://www.chorknaben-ulm.de/geschichte.html", "text_len": 1546, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "1968 bis heute Knabenmusik", "found": true}, {"type": "with", "string": "Der Chor wird durch den 1978", "found": true}, {"type": "with", "string": "973 \u00fcbernahm der damals", "found": true}, {"type": "without", "string": "Seit 50 Jahren sind wir", "found": false}, {"type": "without", "string": "Leitung: Thomas Stang", "found": false}, {"type": "without", "string": "Impressum & Datenschutz", "found": false}]}
{"file": "eatsmarter.de.porridge.html", "url": "https://eatsmarter.de/rezepte/vanille-hafer-porridge-mit-leinsamen-und-apfel", "text_len": 2190, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Haferdrink mit Haferflocken, Vanille und Zimt, Leinsamen", "found": true}, {"type": "with", "string": "N\u00fcsse trocken in einer Pfanne anr\u00f6sten. \u00c4pfel waschen", "found": true}, {"type": "with", "string": "Hafer ist reich an Ballaststoffen und Calcium. Insbesondere der Quellstoff", "found": true}, {"type": "without", "string": "und Beauty. Erfahren Sie hier alles \u00fcber die Kooperation.", "found": false}, {"type": "without", "string": "Eine runde Sache also, wie Sie in dieser Warenkunde erfahren! ", "found": false}, {"type": "without", "string": "Di\u00e4trezepte unter 400 Kcal", "found": false}]}
{"file": "vinosytapas.de.rioja.html", "url": "https://www.vinosytapas.de/wein/herkunft/spanien/d_o_ca_-rioja/", "text_len": 1526, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Bestimmungen der D.O.Ca.", "found": false}, {"type": "with", "string": "F\u00fcr die Qualit\u00e4tsstufen der Weine", "found": false}, {"type": "with", "string": "Mindestlagerzeit Rotwein", "found": true}, {"type": "without", "string": "Es werden die Weine 1 bis 10 von insgesamt 19 angezeigt!", "found": false}, {"type": "without", "string": "Ihr Warenkorb ist leer", "found": false}, {"type": "without", "string": "Patanegra-Schinken aus ", "found": false}]}
{"file": "0ac0531f1f0543f4a3f68159e5fd1875.html", "url": "https://www.dealdoktor.de/user-deals/deals/gutscheine-deals/jacobs-gold-instant-kaffee-2-glaeser-fuer-480-e/", "text_len": 722, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Bei einsendung des Kassenbons", "found": true}, {"type": "with", "string": "4. 6 \u20ac Gutschein f\u00fcr den Einkauf bei Edeka erhalten.", "found": true}, {"type": "with", "string": "Einsendeschluss: 03.11.2019 (Poststempel)", "found": true}, {"type": "without", "string": "Deal abgelaufen? Jetzt melden!", "found": false}, {"type": "without", "string": "Kostenlos zum Newsletter anmelden und", "found": false}, {"type": "without", "string": "Du musst angemeldet sein, um einen Kommentar abzugeben.", "found": false}]}
{"file": "stylegart.de.naturkosmetik.html", "url": "https://www.stylegart.de/naturkosmetik-doch-gesuender/", "text_len": 4556, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wer meine Instastorys flei\u00dfig verfolgt, der wei\u00df, dass ich", "found": true}, {"type": "with", "string": "Tuben und Tiegel mit nat\u00fcrlichen Verpackungen, meist mit Bl\u00fctenprints umrankt versprechen ", "found": true}, {"type": "with", "string": "Dr. Scheller und Lavera, die nat\u00fcrliche Kosmetika zu fairen Preisen anbieten!", "found": true}, {"type": "without", "string": "Was dich erwartet", "found": false}, {"type": "without", "string": "Datenschutzerkl\u00e4rung", "found": false}, {"type": "without", "string": "Vorher-Nachher", "found": false}]}
{"file": "l-mag.de-Holocaust-Gedenken.html", "url": "https://www.l-mag.de/news-1010/holocaust-gedenktag-lesbische-erinnerungskultur-mit-stolpersteinverlegung.html?L=422", "text_len": 3626, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Deutschland waren queere Opfer", "found": true}, {"type": "with", "string": "Mit der Wahl von Dr. Hertha Kraus", "found": true}, {"type": "with", "string": "international an der Integration von", "found": true}, {"type": "without", "string": "Weiterlesen:", "found": false}, {"type": "without", "string": "Die aktuelle Ausgabe der L-MAG", "found": true}, {"type": "without", "string": " von den Wirtschaftsweibern", "found": false}]}
{"file": "battery-news.de.ultium-cells.html", "url": "https://battery-news.de/index.php/2022/12/06/ultium-cells-erhoeht-gigafactory-kapazitaet-in-tennessee/", "text_len": 1630, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ultium Cells investiert", "found": true}, {"type": "with", "string": "Weitere US-Zellprojekte im Aufbau", "found": true}, {"type": "with", "string": "Gesamtvolumen \u00fcber 130 Gigawattstunden", "found": true}, {"type": "without", "string": "Artikel teilen", "found": false}, {"type": "without", "string": "SUCHE", "found": false}, {"type": "without", "string": "NEUESTE BEITR\u00c4GE", "found": false}]}
{"file": "eldeber.com.bo-autos.html", "url": "https://eldeber.com.bo/santa-cruz/investigador-chileno-asegura-que-no-publico-todo-su-material-el-90-de-los-autos-robados-estan-en-pos_276757", "text_len": 3079, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "coronel Ra\u00fal Cabezas Pantoja,", "found": true}, {"type": "with", "string": "recuperaci\u00f3n de la vagoneta. Coment\u00f3", "found": true}, {"type": "with", "string": "devolver los veh\u00edculos.", "found": true}, {"type": "without", "string": "Recomendado para ti", "found": false}, {"type": "without", "string": "ESCUCHA ESTA NOTA AQU\u00cd", "found": false}, {"type": "without", "string": "TE PUEDE INTERESAR", "found": false}]}
{"file": "telemedicus.info.rezension.html", "url": "https://www.telemedicus.info/article/2766-Rezension-Haerting-Internetrecht,-5.-Auflage-2014.html", "text_len": 3728, "tp": 2, "fn": 0, "fp": 0, "tn": 5, "details": [{"type": "with", "string": "Aufbau und Inhalt", "found": true}, {"type": "with", "string": "Verlag Dr. Otto Schmidt", "found": true}, {"type": "without", "string": "Anzeige:", "found": false}, {"type": "without", "string": "Handbuch", "found": false}, {"type": "without", "string": "Drucken", "found": false}, {"type": "without", "string": "\u00c4hnliche Artikel", "found": false}, {"type": "without", "string": "Kommentar schreiben", "found": false}]}
{"file": "feuerwehrtaucher-oldenburg.de.ausbildung.html", "url": "http://feuerwehrtaucher-oldenburg.de/bootsdienst/ausbildung.html", "text_len": 1197, "tp": 3, "fn": 0, "fp": 0, "tn": 1, "details": [{"type": "with", "string": "Die Bootsf\u00fchrerausbildung in der Feuerwehr", "found": true}, {"type": "with", "string": "Wichtig ist die F\u00e4higkeit, eine", "found": true}, {"type": "with", "string": "Auch das slippen der Boote an", "found": true}, {"type": "without", "string": "Rettungsschwimmen", "found": false}]}
{"file": "d76bb5cda4cd4621a04c1b166d6cad9f.html", "url": "https://www.tag24.de/nachrichten/rostow-russland-fuenf-kinder-und-zwei-erwachsene-sterben-bei-schrecklichem-wohnhausbrand-1255262", "text_len": 819, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "als sich das Feuer im Treppenhaus ausbreitete", "found": true}, {"type": "with", "string": "Dachgeschoss brannte vollkommen aus.", "found": true}, {"type": "with", "string": "ob der Brand wegen eines defekten Elektroger\u00e4tes", "found": true}, {"type": "without", "string": "Letzter Auftritt bei", "found": false}, {"type": "without", "string": "FAMILIENDRAMA: MUTTER", "found": false}, {"type": "without", "string": "Wir bei WhatsApp", "found": false}]}
{"file": "Kr\u00f3lowa El\u017cbieta wyp\u0142ywa w \u015bwiat. Sygna\u0142 dla Chin i Rosji - Polityka.pl.html", "url": "https://www.polityka.pl/tygodnikpolityka/swiat/2116825,1,krolowa-elzbieta-wyplywa-w-swiat-sygnal-dla-chin-i-rosji.read", "text_len": 15104, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Pierwszy rejs HMS", "found": true}, {"type": "with", "string": "Bandera pod\u0105\u017ca za handlem", "found": true}, {"type": "with", "string": "zawa\u017cy\u0142a na jego trasie.", "found": true}, {"type": "without", "string": "Czytaj te\u017c", "found": true}, {"type": "without", "string": "By\u0142y dow\u00f3dca wojsk USA", "found": true}, {"type": "without", "string": "starszy analityk", "found": false}]}
{"file": "dbjr.de.bundespraesident.html", "url": "https://www.dbjr.de/artikel/bundespraesident-wuerdigte-das-ehrenamtliche-engagement/", "text_len": 1079, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Steinmeier l\u00e4dt jedes Jahr", "found": false}, {"type": "with", "string": "Zum Empfang kamen", "found": true}, {"type": "with", "string": "Er bat darum", "found": true}, {"type": "without", "string": "10178 Berlin", "found": false}, {"type": "without", "string": "Themen: Ehrenamt Jugendverb\u00e4nde", "found": false}, {"type": "without", "string": "Datenschutz", "found": false}]}
{"file": "bummfilm.de.\u00fcber.html", "url": "http://bummfilm.de/page/index.php?scroll=%DCber", "text_len": 728, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die bumm film GmbH bietet", "found": false}, {"type": "with", "string": "und wurde im Laufe der Zeit", "found": false}, {"type": "with", "string": "Web und Live-Entertainment", "found": false}, {"type": "without", "string": "Kontakt", "found": false}, {"type": "without", "string": "Leistungen", "found": false}, {"type": "without", "string": "Lightbox2 \u00a9 Lokesh Dhakar", "found": false}]}
{"file": "thepostpartumparty.com.nursery.html", "url": "https://thepostpartumparty.com/how-to-set-up-a-baby-nursery-in-a-small-space", "text_len": 7444, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Pick products that can serve multiple purposes", "found": true}, {"type": "with", "string": "Sometimes space is in the eye of the beholder", "found": true}, {"type": "with", "string": "the idea of where to put everything can", "found": true}, {"type": "without", "string": "must-haves, and so much more.", "found": false}, {"type": "without", "string": "Notify me of follow-up comments by email.", "found": false}, {"type": "without", "string": "The Postpartum Party does not offer medical advice", "found": false}]}
{"file": "Sprzeciw wobec atak\u00f3w na Fundacj\u0119 Lux Veritatis - RadioMaryja.pl.html", "url": "https://www.radiomaryja.pl/informacje/sprzeciw-wobec-atakow-na-fundacje-lux-veritatis/", "text_len": 2205, "tp": 0, "fn": 3, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Watchdog wytoczy\u0142", "found": false}, {"type": "with", "string": "Nie mo\u017cemy pozwoli\u0107 na", "found": false}, {"type": "with", "string": "n\u0119kania Fundacji Lux Veritatis", "found": false}, {"type": "without", "string": "wi\u0119cej]", "found": false}, {"type": "without", "string": "drukuj", "found": false}, {"type": "without", "string": "RIRM", "found": true}]}
{"file": "lbv.de-Bavaria.html", "url": "https://www.lbv.de/news/details/lebenszeichen-von-bavaria-nach-zwei-monaten-funkstille/", "text_len": 6215, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "November ausgefallener Sender", "found": true}, {"type": "with", "string": "Ladestand von drei Prozent", "found": true}, {"type": "with", "string": "der GPS-Daten im G\u00e4stebuch", "found": true}, {"type": "without", "string": "Online-Fangemeinde war beunruhig", "found": false}, {"type": "without", "string": "zum Naturschutz in Bayern", "found": false}, {"type": "without", "string": "LBV-HOCHSCHULGRUPPEN:", "found": false}]}
{"file": "leichtathletik-ostalbkreis.de.1952007.html", "url": "https://blog.leichtathletik-ostalbkreis.de/2007/05/20/ergebnisse-rm-schuelerinnen-a-aalen-unterkochen-1952007/", "text_len": 106492, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "1. und Regionalmeister 2007", "found": true}, {"type": "with", "string": "Schlumberger, Lea 1993;", "found": true}, {"type": "with", "string": "LG Staufen", "found": true}, {"type": "without", "string": "LA-Kreis Ulm/Alb-Donau", "found": false}, {"type": "without", "string": "LA-Kreis G\u00f6ppingen", "found": false}, {"type": "without", "string": "LAC Essingen", "found": false}]}
{"file": "hundeverein-kreisunna.de.html", "url": "http://www.hundeverein-kreisunna.de/unserverein.html", "text_len": 2143, "tp": 2, "fn": 0, "fp": 0, "tn": 1, "details": [{"type": "with", "string": "Beate und Norbert Olschewski", "found": true}, {"type": "with", "string": "ein Familienmitglied und unser Freund.", "found": true}, {"type": "without", "string": "zur\u00fcck zur Startseite", "found": false}]}
{"file": "anwaltniemeyer.de.index.html", "url": "https://anwaltniemeyer.de/index.html", "text_len": 432, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Ich bin Jens-Christof", "found": true}, {"type": "with", "string": "Ich freue mich", "found": true}, {"type": "with", "string": "und mittelst\u00e4ndischen Unternehmen", "found": true}, {"type": "without", "string": "Fachanwalt f\u00fcr IT-Recht", "found": true}, {"type": "without", "string": "9, 32130 Enger", "found": true}, {"type": "without", "string": "Service", "found": false}]}
{"file": "losandes.com-mendoza.html", "url": "https://www.losandes.com.ar/sociedad/el-ano-de-las-evaluaciones-las-escuelas-de-mendoza-tendran-tres-relevamientos-de-calidad-educativa/", "text_len": 5338, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "escuelas mendocinas. El gobierno", "found": true}, {"type": "with", "string": "que se realizar\u00e1 en mayo,", "found": true}, {"type": "with", "string": "Evaluaci\u00f3n Internacional de Alumnos de", "found": true}, {"type": "without", "string": "TEMAS RELACIONADOS", "found": false}, {"type": "without", "string": "El mendocino que suma su ayuda", "found": false}, {"type": "without", "string": "Los ex\u00e1menes PISA en Mendoza se realizar\u00e1n", "found": false}]}
{"file": "unterwegsinberlin.de.friedrichsfelde.html", "url": "https://www.unterwegsinberlin.de/radtouren-berlin/radtour-durch-friedrichsfelde-karlshorst-und-schoeneweide/", "text_len": 4053, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Meine neue Lieblings-Radtour", "found": true}, {"type": "with", "string": "ca. 80 m links", "found": true}, {"type": "with", "string": "um das Gel\u00e4nde herum", "found": true}, {"type": "without", "string": "Klicken Sie auf den unteren", "found": true}, {"type": "without", "string": "Keine Lust alleine zu", "found": false}, {"type": "without", "string": "Kein Fahrrad zur Hand?", "found": false}]}
{"file": "tagesschau.de.rheinmetall.html", "url": "https://www.tagesschau.de/investigativ/ndr/rheinmetall-datenleck-101.html", "text_len": 6980, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "h NDR-Recherchen von einem Datenleck betroffen: Mehr als 1000 interne Unterlagen kursiere", "found": true}, {"type": "with", "string": "Der Datensatz liegt dem NDR vor.", "found": true}, {"type": "with", "string": "Rheinmetall stellt in den damals betroffenen Fabriken Bauteile f\u00fcr die Autoindustrie her.", "found": true}, {"type": "without", "string": "Darstellung", "found": false}, {"type": "without", "string": "Rundfunkanstalten", "found": false}, {"type": "without", "string": "Tagesschau Investigativ", "found": false}]}
{"file": "linkedin.com.hoeltmann.html", "url": "https://www.linkedin.com/pulse/ich-war-am-wochenende-auf-einer-hochzeit-im-wendland-inga-hoeltmann", "text_len": 3937, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Das Wendland ist eine sch\u00f6ne, aber sehr l\u00e4ndliche", "found": true}, {"type": "with", "string": "hinnehmen als sei es nicht zu \u00e4ndern. Besch\u00e4mend.", "found": true}, {"type": "with", "string": "Konzepte abseits der urbanen R\u00e4ume in", "found": true}, {"type": "without", "string": "Einstellungen f\u00fcr Nichtmitglieder", "found": false}, {"type": "without", "string": "Nutzervereinbarung", "found": false}, {"type": "without", "string": "Markenrichtlinine", "found": false}]}
{"file": "theatlantic.com.disasters.html", "url": "https://www.theatlantic.com/ideas/archive/2020/08/californias-disasters-are-a-warning-climate-change-is-here/615610/", "text_len": 7025, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "When I moved to California five years ago", "found": true}, {"type": "with", "string": "Yet some people refuse to acknowledge that climate change", "found": true}, {"type": "with", "string": "happening in California has a name: climate change", "found": true}, {"type": "without", "string": "We want to hear what you think about this article.", "found": true}, {"type": "without", "string": "Some were blasted by critics, some flopped at the", "found": false}, {"type": "without", "string": "Subscribe and support 162 years of independent journalism", "found": false}]}
{"file": "zvei.org.messestellenbetriebsgesetz.html", "url": "https://www.zvei.org/presse-medien/pressebereich/messstellenbetriebsgesetz-endlich-klarheit-geschaffen ", "text_len": 1894, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wolfgang Weber, Vorsitzender", "found": true}, {"type": "with", "string": "Insbesondere ist hervorzuheben", "found": true}, {"type": "with", "string": "Der Entwurf kommt dennoch", "found": true}, {"type": "without", "string": "Weiterf\u00fchrende Informationen", "found": false}, {"type": "without", "string": "Folgen Sie uns", "found": false}, {"type": "without", "string": "Zur\u00fcck zur \u00dcbersicht", "found": false}]}
{"file": "mdr.de.autohaeuser.html", "url": "https://www.mdr.de/thueringen/corona-lockerung-autohaeuser-werkstatten-100.html", "text_len": 1820, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Gesch\u00e4ftes. Helmut Peter von der gleichnamigen Autohaus-Gruppe sagte MDR TH\u00dcRINGEN am Mo", "found": true}, {"type": "with", "string": "ann. Nach Informationen von MDR TH\u00dcRINGEN hatte ein VW-H\u00e4ndler in Erfurt bis Montagmorgen nicht gewusst, dass er wieder Kunden im Autohaus beraten darf. Ein BMW-H\u00e4ndler in Weimar erkl\u00e4rte, auch in d", "found": true}, {"type": "with", "string": "am Montag, die H\u00e4ndler seien froh, dass sie wieder die Verkaufsr\u00e4ume \u00f6ffnen d\u00fcrften. Allerdings se", "found": true}, {"type": "without", "string": "Weitere Informationen zum Coronavirus in Th\u00fcringen:", "found": true}, {"type": "without", "string": "Mehr aus Th\u00fcringen", "found": false}, {"type": "without", "string": "Der Mitteldeutsche Rundfunk ist Mitglied der ARD.", "found": false}]}
{"file": "wevolver.com.3dprinting.html", "url": "https://www.wevolver.com/article/3dprinting.gets.a.turbo.boost.from.um.technology", "text_len": 3461, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "The algorithm allows printers to deliver high-quality results", "found": true}, {"type": "with", "string": "Chinedum Okwudire", "found": true}, {"type": "with", "string": "vibration-induced error compensation of a 3D printer", "found": true}, {"type": "without", "string": "Search for articles and topics", "found": false}, {"type": "without", "string": "Create smart machines.", "found": false}, {"type": "without", "string": "We reach millions of professional engineers", "found": false}]}
{"file": "bundespolizei.de-Belarus.html", "url": "https://www.bundespolizei.de/Web/DE/04Aktuelles/01Meldungen/2021/10/staendige_aktualisierung_migrationslage.html;jsessionid=51A21717FEF5DF385B5C87C9E5FABD92.2_cid324", "text_len": 2187, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Die deutsch-polnische Grenze", "found": true}, {"type": "with", "string": "Bei Personen, die unerlaubt", "found": true}, {"type": "with", "string": "Lesen Sie dazu auch die", "found": true}, {"type": "without", "string": "Illegale Migration aus Belarus \u00fcber", "found": true}, {"type": "without", "string": "Seite drucken", "found": false}, {"type": "without", "string": "So erreichen Sie uns:", "found": false}]}
{"file": "internetchemie.info.Heliumkerne.html", "url": "https://internetchemie.info/news/2021/jan21/heliumkerne-in-zinn-atomen-entdeckt.php", "text_len": 5663, "tp": 2, "fn": 1, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Darmstadt - Januar 2021", "found": true}, {"type": "with", "string": "Im Detail:", "found": false}, {"type": "with", "string": "Die von Tanaka et al", "found": true}, {"type": "without", "string": "Zusatzinformationen:", "found": true}, {"type": "without", "string": "About", "found": false}, {"type": "without", "string": "Aktualisiert am", "found": true}]}
{"file": "ga.de-Graffiti.html", "url": "https://ga.de/bonn/beuel/mural-in-bonn-graffiti-an-stiftung-gemeindepsychatrie-in-beuel_aid-99369101", "text_len": 3067, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Riesengro\u00dfe K\u00f6pfe im Profil", "found": false}, {"type": "with", "string": "ein Mann mit rotem Hut ist schemenhaft \u00fcber den Kopf", "found": false}, {"type": "with", "string": "einer Frau mit geflochtenem Zopf in Blau gelegt", "found": false}, {"type": "without", "string": "Jetzt weiterlesen mit", "found": false}, {"type": "without", "string": "Wir liefern mit anspruchsvollem, modernem Journalismus die Informationen", "found": false}, {"type": "without", "string": "die f\u00fcr Menschen in unserer Region wichtig sind.", "found": false}]}
{"file": "sprechblase.wordpress.com.zapfsaeulen.html", "url": "https://sprechblase.wordpress.com/2019/11/17/elektro-zapfsaeulen/", "text_len": 447, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ich w\u00fcrde ja", "found": true}, {"type": "with", "string": "Drumrum und Service", "found": true}, {"type": "with", "string": "Ich bedanke mich", "found": true}, {"type": "without", "string": "Life is not digital", "found": false}, {"type": "without", "string": "Bewerten:", "found": false}, {"type": "without", "string": "Micro-Series: Born Entrepreneurs", "found": false}]}
{"file": "archive.org.nesselsetzer.wordpress.com.antipoden.html", "url": "https://web.archive.org/web/20140109030403/http://nesselsetzer.wordpress.com/2013/12/09/rebloggt-von-gnaddrig-ad-libitum-antipoden-die-wahrheit/", "text_len": 1417, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Gnaddrigs erstaunliche Betrachtungsweise und die Entwicklung einer Theorie", "found": true}, {"type": "with", "string": "ob auf der anderen Seite der Erde \u00fcberhaupt Menschen leben k\u00f6nnen.", "found": true}, {"type": "with", "string": "musste so sein, weil wir hier ja nachweislich mit den F\u00fc\u00dfen nach unten und dem Kopf nach oben herumlaufen", "found": true}, {"type": "without", "string": "Die d\u00fcmmste aller Verschw\u00f6rungstheorien: Chemtrails", "found": false}, {"type": "without", "string": "Gef\u00e4llt mir", "found": false}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}]}
{"file": "Windows 10 od lipca przestanie obs\u0142ugiwa\u0107 Adobe Flash.html", "url": "https://spidersweb.pl/2021/05/windows-10-flash.html", "text_len": 2313, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "W pa\u017adzierniku na", "found": true}, {"type": "with", "string": "wspomniane cyberbezpiecze\u0144stwo.", "found": true}, {"type": "with", "string": "nigdy go nie obs\u0142ugiwa\u0142y.", "found": true}, {"type": "without", "string": "do dyskusji", "found": false}, {"type": "without", "string": "U\u017cywamy informacji zapisanych", "found": false}, {"type": "without", "string": "UDOST\u0118PNIJ", "found": false}]}
{"file": "weisser-ring.de-Erfolgsgechichte.html", "url": "https://weisser-ring.de/media-news/meldungen/29-10-2021", "text_len": 1441, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "bundesweiten Einbruchschutzkampagne K-EINBRUCH", "found": true}, {"type": "with", "string": "seit 2015 kontinuierlich", "found": true}, {"type": "with", "string": "Wenn Sie Ihr Haus verlassen", "found": false}, {"type": "without", "string": "Foto: www.k-einbruch.de", "found": false}, {"type": "without", "string": "Zur\u00fcck zur \u00dcbersicht", "found": false}, {"type": "without", "string": "Startseite", "found": false}]}
{"file": "swim.de-ga2.html", "url": "https://swim.de/training/lagen-pyramide-mit-ga2/", "text_len": 1628, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "W\u00e4hlen Sie \u00dcbungen, bei denen Sie sich", "found": true}, {"type": "with", "string": "vierten Stufe d\u00fcrfen Sie entscheiden,", "found": true}, {"type": "with", "string": "H\u00e4lfte der Teilstrecke in", "found": true}, {"type": "without", "string": "studierte Sportwissenschaften, bevor", "found": false}, {"type": "without", "string": "Starker Serienauftakt in der", "found": false}, {"type": "without", "string": "Wenn du auf den Abo-Button klickst, verpasst", "found": false}]}
{"file": "5min.at-Villachs.html", "url": "https://www.5min.at/5lokales/villachs-meister-proper-expandiert-nach-wien/", "text_len": 2206, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Chef Boris Dujakovic gr\u00fcndete Filana", "found": true}, {"type": "with", "string": "vor \u00fcber vier Jahren als Hausmeisterservice", "found": true}, {"type": "with", "string": "In den letzten 2 Jahren hat er sich aber vor allem auf Grundreinigung", "found": true}, {"type": "without", "string": "Mehr Interessantes", "found": false}, {"type": "without", "string": "Wetter aktuell", "found": false}, {"type": "without", "string": "Meistgeklickt", "found": false}]}
{"file": "rechtambild.de.kochbuch.html", "url": "https://www.rechtambild.de/2011/10/bgh-marions-kochbuch-de/", "text_len": 26543, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Leits\u00e4tze des Gerichts", "found": true}, {"type": "with", "string": "III. Die Revision der Beklagten", "found": true}, {"type": "without", "string": "twittern", "found": false}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}, {"type": "without", "string": "d.toelle[at]rechtambild.de", "found": false}]}
{"file": "columbus-entdeckt.de.trolls.html", "url": "http://columbus-entdeckt.de/ski-fahren-auf-den-spuren-des-trolls/", "text_len": 610, "tp": 3, "fn": 0, "fp": 0, "tn": 1, "details": [{"type": "with", "string": "Island lockt auch im Winter", "found": true}, {"type": "with", "string": "Das gr\u00f6\u00dfte in Akureyri hat f\u00fcnf Lifte", "found": true}, {"type": "with", "string": "und auf den Spuren des Trolls", "found": true}, {"type": "without", "string": "Die besten Reisegeschichten", "found": false}]}
{"file": "it-finanzmagazin.de.creditshelf.html", "url": "https://www.it-finanzmagazin.de/creditshelf-kooperiert-mit-finleap-und-plant-akquisition-der-valendo-gmbh-90871/", "text_len": 3616, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die geplante Kooperation von creditshelf mit finleap", "found": true}, {"type": "with", "string": "Beide Parteien streben den Abschluss des Erwerbs der Valendo", "found": true}, {"type": "with", "string": "creditshelf er\u00f6ffnet die geplante Akquisition der Valendo GmbH", "found": true}, {"type": "without", "string": "Jede Woche neu:", "found": false}, {"type": "without", "string": "(Noch keine Bewertungen)", "found": false}, {"type": "without", "string": "Auch interessant", "found": false}]}
{"file": "fouryears.eu.interning.html", "url": "http://fouryears.eu/2019/10/21/interning-of-small-integers-in-python/", "text_len": 448, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Note that depending on the version of Python the value of the integer", "found": true}, {"type": "with", "string": "lovely example, illustrating the way Python", "found": true}, {"type": "with", "string": "(addr, ctypes.", "found": true}, {"type": "without", "string": "Best western clearfield pa on Skype \"removed\" messages", "found": false}, {"type": "without", "string": "6 Regularization Techniques for Deep Learning", "found": false}, {"type": "without", "string": "Konstantin on ROC Area-Under-the-Curve Explained", "found": false}]}
{"file": "amnesty.de-waffensysteme.html", "url": "https://www.amnesty.de/allgemein/pressemitteilung/autonome-waffensysteme-gefahr-menschenrechte", "text_len": 4615, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "die globale Kampagne", "found": true}, {"type": "with", "string": "wird zu verheerenden Verst\u00f6\u00dfen", "found": true}, {"type": "with", "string": "nationalen Nichtregierungsorganisationen", "found": true}, {"type": "without", "string": "Wir respektieren deine Privatsph\u00e4re", "found": false}, {"type": "without", "string": "Aktuell", "found": false}, {"type": "without", "string": "Getty Images", "found": true}]}
{"file": "jungle.world-Imperialismus-Phantom.html", "url": "https://jungle.world/artikel/2023/43/diskussion-begriff-imperialismus-das-phantom", "text_len": 10182, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In den vergangenen 100 Jahren", "found": true}, {"type": "with", "string": "war noch nie so viel von Imperialismus die Rede wie heute", "found": true}, {"type": "with", "string": "und zwar quer durch die politischen Lager", "found": true}, {"type": "without", "string": "Artikel zum Thema", "found": false}, {"type": "without", "string": "Die Hamas und die blinden Flecken der Linken", "found": false}, {"type": "without", "string": "Imperialismustheorie statt Antiimperialismus", "found": false}]}
{"file": "miamitodaynews.com-Transitway.html", "url": "https://www.miamitodaynews.com/2023/11/07/transit-tax-trust-rejects-countys-south-dade-transitway-data/", "text_len": 5986, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Also delaying the response, Mr. Cueto said", "found": true}, {"type": "with", "string": "was that the county made the video presentation and then briefed", "found": true}, {"type": "with", "string": "accurate and is aligned with those funding partners", "found": true}, {"type": "without", "string": "South Dade rapid transit will be rapid in only one direction", "found": false}, {"type": "without", "string": "Send South Dade Transitway back to square one, trust urged", "found": false}, {"type": "without", "string": "County vowed a transit Rolls Royce; we\u2019re getting a Ford", "found": false}]}
{"file": "kulturkaufhaus.de-basteln.html", "url": "https://www.kulturkaufhaus.de/de/kultur-magazin/blogDetail/DIY-Farbbuch-artcBlog?bpmctrl=bpmrownr.1%7Cforeign.323438-1-0-267787", "text_len": 2043, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "wie man ein B\u00fcchlein aus einem A3", "found": true}, {"type": "with", "string": "1 Wasserglas mit Wasser", "found": true}, {"type": "with", "string": "wenn ihr unser DIY nachbastelt", "found": true}, {"type": "without", "string": "Kategorien", "found": false}, {"type": "without", "string": "Du m\u00f6chtest in Ruhe nachbasteln?", "found": false}, {"type": "without", "string": "Zuletzt besuchte Seiten", "found": false}]}
{"file": "jovelstefan.de.gefallt.html", "url": "http://www.jovelstefan.de/2011/09/11/gefallt-mir/", "text_len": 369, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Manchmal \u00fcberrascht einen", "found": true}, {"type": "with", "string": "kein Meisterwerk war!", "found": true}, {"type": "without", "string": "Pingback von", "found": false}, {"type": "without", "string": "Kommentare geschlossen", "found": false}]}
{"file": "luxuryhaven.co.hyatt.html", "url": "https://www.luxuryhaven.co/2019/05/nam-nghi-phu-quoc-unbound-collection-by-hyatt-officially-opens.html", "text_len": 4358, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Grounded in sustainable architecture and refined Vietnamese craftsmanship,", "found": true}, {"type": "with", "string": "and Carmelo Resort", "found": true}, {"type": "with", "string": "Dining and Drinking", "found": true}, {"type": "without", "string": "Food Advertising by", "found": false}, {"type": "without", "string": "A lovely note makes a beautiful day!", "found": false}, {"type": "without", "string": "Reply", "found": false}]}
{"file": "advents-shopping.de.weihnachtsmaerkte.html", "url": "https://www.advents-shopping.de/die-weihnachtsmarkt-saison-beginnt-so-finden-sie-die-besten-weihnachtsmaerkte-in-ihrer-naehe.html", "text_len": 1781, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "P\u00fcnktlich mit dem Beginn der", "found": true}, {"type": "with", "string": "Ein neues Layout stellt sicher", "found": true}, {"type": "with", "string": "ein kostenlose Webapplikation", "found": true}, {"type": "without", "string": "Ihr weihnachtlicher Kurzurlaub", "found": false}, {"type": "without", "string": "Advents-Shopping.de nimmt Sie mit in die", "found": false}, {"type": "without", "string": "o finden Sie die besten Weihnachtsm\u00e4rkte", "found": true}]}
{"file": "d27eb719099b43639104995806e07d00.html", "url": "https://www.mopo.de/sport/hsv/fuer-den-hsv-in-der-oberliga--jansen-kaempft-um-trochowskis-comeback-33334622", "text_len": 2002, "tp": 3, "fn": 0, "fp": 0, "tn": 5, "details": [{"type": "with", "string": "k\u00fcnftig wieder f\u00fcr den HSV auf? ", "found": true}, {"type": "with", "string": "Es bringt riesigen Spa\u00df, die Liga hat sehr viel Tradition", "found": true}, {"type": "with", "string": "Oberliga ist keine Pillepalle-Liga", "found": true}, {"type": "without", "string": "haben einen guten Draht.", "found": false}, {"type": "without", "string": "4 Tsd. Abonnenten", "found": false}, {"type": "without", "string": "Kommentieren Sie hier", "found": false}, {"type": "without", "string": "URL zum Kopieren", "found": false}, {"type": "without", "string": "Messenger", "found": false}]}
{"file": "villagersandheroes.com.forums.patchnotes.html", "url": "https://villagersandheroes.com/forums/threads/patchnotes-4-47-4-tagundnachtgleiche-bugfix-build.3976/", "text_len": 8952, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Farbe der Spawn-Ank\u00fcndigungen wurde ge\u00e4ndert auf orange", "found": true}, {"type": "with", "string": "erh\u00f6hen, zum Schaden aber nur begrenzt beitragen, entsteht.", "found": true}, {"type": "with", "string": "Was jeder von Euch daraus nun f\u00fcr Konsequenzen zieht in Eventzonen", "found": true}, {"type": "without", "string": "Forum software by XenForo\u00ae \u00a9 2010-2019 XenForo Ltd.", "found": false}, {"type": "without", "string": " Terms and rules", "found": false}, {"type": "without", "string": " Privacy policy", "found": false}]}
{"file": "n-land.de-Simmelsdorf.html", "url": "https://n-land.de/top-story/74-jaehriger-stirbt-nach-unfall-in-simmelsdorf", "text_len": 626, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Gegen\u00fcber einer Verkehrsteilnehmerin", "found": true}, {"type": "with", "string": "die sich mit ihrem Fahrzeug hinter dem Pkw-Fahrer befand", "found": true}, {"type": "with", "string": "gab er gesundheitliche Probleme an und verlor das Bewusstsein", "found": true}, {"type": "without", "string": "Das k\u00f6nnte Sie auch interessieren", "found": false}, {"type": "without", "string": "Unbekannter stiehlt mehrere E-Bikes aus Kellerabteilen in Altdorf", "found": false}, {"type": "without", "string": "\u00dcber drei Promille: Alkoholisierter Fahrer baut Unfall in Lauf", "found": false}]}
{"file": "sprechwaisen.com.sw082.html", "url": "http://www.sprechwaisen.com/sw082-82-gruende-zum-weiter-hoeren/", "text_len": 391, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ingo hat ja gesagt", "found": true}, {"type": "with", "string": "Oder damit Petra", "found": true}, {"type": "with", "string": "\u00c4u\u00dfert Vermutungen", "found": true}, {"type": "without", "string": "Deine E-Mail-Adresse", "found": false}, {"type": "without", "string": "Der geheimnisvolle Button", "found": false}, {"type": "without", "string": "This entry was posted ", "found": false}]}
{"file": "acpjournals.org.3075.html", "url": "https://www.acpjournals.org/doi/10.7326/M19-3075", "text_len": 14731, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "cination reduces hospitalizations and mortality among elderly persons. Acc", "found": true}, {"type": "with", "string": "ged 55 to 75 years residing in the study area during 2000 to 2014.", "found": true}, {"type": "with", "string": "Primary Funding Source:", "found": true}, {"type": "without", "string": "ACP Journals home", "found": false}, {"type": "without", "string": "Institutions / Libraries / Agencies", "found": false}, {"type": "without", "string": "2020 American College of", "found": false}]}
{"file": "trome.pe-chollywood.html", "url": "https://trome.pe/espectaculos/dia-de-la-madre-trome-celebro-con-las-mamitas-de-chollywood-magaly-medina-janet-barboza-noticia/", "text_len": 4427, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "porque siempre fui muy estudiosa,", "found": true}, {"type": "with", "string": "descubrir\u00eda, pues no iba as\u00ed nom\u00e1s a mi", "found": true}, {"type": "with", "string": "culp\u00e9 a mi hermano, pero finalmente", "found": true}, {"type": "without", "string": "Silvia N\u00fa\u00f1ez del Arco: \u201cJaime", "found": true}, {"type": "without", "string": "y origen de su apodo", "found": true}, {"type": "without", "string": "cont\u00f3 la historia de un flan, que se comi\u00f3 en su infancia.", "found": false}]}
{"file": "buero-hoppe.de.baumgutachten.html", "url": "http://www.buero-hoppe.de/baumgutachten.htm", "text_len": 4387, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Die Erstellung von Baumgutachten", "found": true}, {"type": "with", "string": "Es gibt eine Vielzahl von Gr\u00fcnden", "found": true}, {"type": "with", "string": "Baumkataster eine sinnvolle Investition.", "found": true}, {"type": "without", "string": "Um unsere Webseite f\u00fcr Sie", "found": false}, {"type": "without", "string": "Leistungen und Informationen im", "found": true}, {"type": "without", "string": "Planungsb\u00fcro G. & L. Hoppe", "found": true}]}
{"file": "evref.ch-\u00f6kumene.html", "url": "https://www.evref.ch/oekumene-trifft-diplomatie-aussenminister-cassis-und-kardinalstaatssekretaer-parolin-besuchen-synode-der-eks/", "text_len": 4113, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In ihren Grussw\u00f6rtern", "found": false}, {"type": "with", "string": "Cassis auf die parlamentarische", "found": true}, {"type": "with", "string": "Pr\u00e4sidentin Rita Famos \u00fcberreichte", "found": true}, {"type": "without", "string": "Stefan Wermuth", "found": false}, {"type": "without", "string": "Aktuelles", "found": false}, {"type": "without", "string": "Bilder des Treffens", "found": false}]}
{"file": "bergsteigen.com-skibergsteigen.html", "url": "https://www.bergsteigen.com/produkte/skibergestiegen-schnell-und-leicht-mit-den-camp-neuheiten/", "text_len": 4262, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Fixer Aluminiumstock", "found": true}, {"type": "with", "string": "ambitionierte Skibergsteiger, die", "found": true}, {"type": "with", "string": " X-Press-Hauptskihalter mit innovativem", "found": true}, {"type": "without", "string": "KOMMENTARE", "found": false}, {"type": "without", "string": "KOMMENDE TERMINE", "found": false}, {"type": "without", "string": "One Love \u2013 Babsi Zangerl und Jacopo Larcher", "found": false}]}
{"file": "spektrum.de.coronavirus.html", "url": "https://www.spektrum.de/wissen/laesst-sich-die-coronavirus-ausbreitung-in-deutschland-kontrollieren/1700384", "text_len": 31378, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In Baden-W\u00fcrttemberg und NRW", "found": false}, {"type": "with", "string": "Ein Problem: So viele Berichte und Nachrichten", "found": true}, {"type": "with", "string": "Viele Menschen haben nur eine leichte", "found": true}, {"type": "without", "string": "Wenn Sie inhaltliche Anmerkungen zu", "found": false}, {"type": "without", "string": "Bleiben Sie auf dem Laufenden", "found": false}, {"type": "without", "string": "Lesedauer ca. 6", "found": false}]}
{"file": "talent.ch.5031.html", "url": "https://www.talent.ch/?p=5031", "text_len": 3492, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Abnahme Protokoll der letzten Vorstandssitzung", "found": true}, {"type": "with", "string": "Johannes schickt seinen Entwurf f\u00fcr einen", "found": true}, {"type": "with", "string": "Daniel sucht nach M\u00f6glichkeiten", "found": true}, {"type": "without", "string": "M\u00f6chtest du TALENT einfach nur", "found": false}, {"type": "without", "string": "Oder du \u00fcberweisst deine Spende", "found": false}, {"type": "without", "string": "Es gibt derzeit keine bevorstehenden Veranstaltungen.", "found": false}]}
{"file": "ukbdnews.com.23646.html", "url": "https://ukbdnews.com/2020/08/23646/", "text_len": 1079, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u0995\u09c1\u09b7\u09cd\u099f\u09bf\u09af\u09bc\u09be-\u09e7 (\u09a6\u09cc\u09b2\u09a4\u09aa\u09c1\u09b0) \u0986\u09b8\u09a8\u09c7\u09b0 \u09b8\u0982\u09b8\u09a6 \u09b8\u09a6\u09b8\u09cd\u09af (\u098f\u09ae\u09aa\u09bf) \u0985\u09cd\u09af\u09be\u09a1\u09ad\u09cb\u0995\u09c7\u099f", "found": true}, {"type": "with", "string": "\u0986\u099c \u09b6\u09a8\u09bf\u09ac\u09be\u09b0 (\u09e8\u09ef \u0986\u0997\u09b8\u09cd\u099f) \u09b8\u0995\u09be\u09b2 \u09b8\u09be\u09a1\u09bc\u09c7 \u09ed\u099f\u09be\u09b0", "found": true}, {"type": "without", "string": "\u0995\u09b0\u09cb\u09a8\u09be\u09af\u09bc \u0986\u09b0\u0993 \u09e9\u09e8 \u099c\u09a8\u09c7\u09b0 \u09ae\u09c3\u09a4\u09cd\u09af\u09c1, \u09a8\u09a4\u09c1\u09a8 \u09b6\u09a8\u09be\u0995\u09cd\u09a4 \u09e8\u09e7\u09e9\u09e7", "found": false}, {"type": "without", "string": "\u0987\u09ad\u09cd\u09af\u09be\u09b2\u09bf\u09b0 \u09b8\u09bf\u0987\u0993 \u09b0\u09be\u09b8\u09c7\u09b2\u09c7\u09b0", "found": false}, {"type": "without", "string": " \u0986\u0997\u09b8\u09cd\u099f \u09e8\u09ef", "found": false}]}
{"file": "golfpost.de-premiere.html", "url": "https://www.golfpost.de/golf-im-tv-777789172/", "text_len": 1969, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Nach zuvor zwei Rolex-Series-Events", "found": true}, {"type": "with", "string": "Kalifornien, die DP World Tour", "found": false}, {"type": "with", "string": "Deutsche um Max Kieffer, Matti Schmid", "found": true}, {"type": "without", "string": "Jetzt f\u00fcr Golf-Lotse Top-News anmelden", "found": false}, {"type": "without", "string": "News rund um PGA Tour", "found": false}, {"type": "without", "string": "\u00dcberblick. (Foto: Getty)", "found": false}]}
{"file": "vice.com.amazon.html", "url": "https://www.vice.com/en_uk/article/d3avvm/the-amazon-is-on-fire-and-the-smoke-can-be-seen-from-space", "text_len": 3491, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Brazil went dark.", "found": true}, {"type": "with", "string": "the highest number of deforestation warnings.\u201d", "found": true}, {"type": "without", "string": "Tagged:", "found": false}, {"type": "without", "string": "to the VICE newsletter.", "found": false}, {"type": "without", "string": "Watch this next", "found": false}]}
{"file": "de.induux.com.energiezaehler.html", "url": "https://de.induux.com/4press/energiezaehler-m-bus-mod-bus-ethernet-mid-3999/", "text_len": 2078, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Lovato Elctric erweitert sein umfangreiches Produktprogramm im Bereich E-Managemnt jetzt mit Ger\u00e4te die f\u00fcr den deutschen Markt besonders interessant sind.", "found": true}, {"type": "with", "string": "0,5s Genauigkeitsklasse", "found": true}, {"type": "with", "string": "Nennversorgungsspannung: 380...415VAC (L-L)", "found": true}, {"type": "without", "string": "Angebote Lovato Electric", "found": false}, {"type": "without", "string": "Die internationale Industrie-Plattform", "found": false}, {"type": "without", "string": "Karriere", "found": false}]}
{"file": "soundofscience.fr.1927.html", "url": "https://www.soundofscience.fr/1927", "text_len": 7576, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "En r\u00e9action \u00e0 la candidature", "found": true}, {"type": "with", "string": "Une cible,", "found": true}, {"type": "with", "string": "Sans recherche autonome,", "found": true}, {"type": "without", "string": "Image illustrative", "found": true}, {"type": "without", "string": "Votre adresse de messagerie", "found": false}, {"type": "without", "string": "Le montage du CNRS", "found": false}]}
{"file": "ekd.de-Friedensdekade.html", "url": "https://www.ekd.de/andacht-zur-friedensdekade-in-der-kaiser-wilhelm-69810.htm", "text_len": 5333, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Bevollm\u00e4chtigter des", "found": true}, {"type": "with", "string": "mit euch und Friede", "found": true}, {"type": "with", "string": "unerschrocken und furchtlos", "found": true}, {"type": "without", "string": "SCHWERPUNKTE DER EKD", "found": false}, {"type": "without", "string": "Sie suchen Fakten", "found": false}, {"type": "without", "string": "Deswegen haben wir", "found": false}]}
{"file": "liquimoly-hbl.de-cheftrainer.html", "url": "https://www.liquimoly-hbl.de/de/n/news/2--liga/2021-22/transfers/tsv-bayer-dormagen/neuer-cheftrainer-fuer-dormagen--matthias-flohr-uebernimmt-ab-sommer-2022/", "text_len": 2720, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "mit einer bestens motivierten Mannschaft den", "found": true}, {"type": "with", "string": "Haases breitem Netzwerk. Auch heimische", "found": true}, {"type": "with", "string": "aber ich habe ein gutes Gef\u00fchl", "found": true}, {"type": "without", "string": "Verwandte Themen", "found": false}, {"type": "without", "string": "Coburg", "found": false}, {"type": "without", "string": "#diewiesel", "found": false}]}
{"file": "presse-ausburg.de-Tarifverbund.html", "url": "https://presse-augsburg.de/augsburger-verkehrs-und-tarifverbund-avv-erhoeht-die-oepnv-preise-deutlich/909665/", "text_len": 2863, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wir m\u00fcssen insbesondere die stark gestiegenen Kosten", "found": true}, {"type": "with", "string": "f\u00fcr Energie und Kraftstoff an die Verkehrsunternehmer ausgleichen", "found": true}, {"type": "with", "string": "um die Grundlage zu schaffen", "found": true}, {"type": "without", "string": "Jetzt Singles finden", "found": false}, {"type": "without", "string": "Nachrichten f\u00fcr Augsburg und Bayerisch-Schwaben.", "found": false}, {"type": "without", "string": "Pro Asyl nennt EU-Migrationsdeal \u201ehistorischen Tiefpunkt\u201c", "found": false}]}
{"file": "wbf.admin.ch.14093.html", "url": "https://www.wbf.admin.ch/wbf/de/home/dokumentation/nsb-news_list.msg-id-14093.html", "text_len": 14413, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "beim SP-St\u00e4dtegipfel", "found": true}, {"type": "with", "string": "Dies f\u00fchrt dazu, dass die Sozialpolitik", "found": true}, {"type": "with", "string": "wie in der Nationalhymne,", "found": true}, {"type": "without", "string": "Kommunikationsdienst", "found": false}, {"type": "without", "string": "Letzte \u00c4nderung", "found": true}, {"type": "without", "string": "Informiert bleiben", "found": false}]}
{"file": "zdh.de-foerderungsstopp.html", "url": "https://www.zdh.de/presse/veroeffentlichungen/pressemitteilungen/kfw-foerderungsstopp-ist-klimapolitisch-fatales-signal/", "text_len": 2169, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "und nicht akzeptabel ist, dass", "found": true}, {"type": "with", "string": " Bundesregierung aufgefordert, verl\u00e4ssliche", "found": true}, {"type": "with", "string": "CO2-Minderungs- und Klimaschutzziele so wichtig", "found": true}, {"type": "without", "string": "Schlagworte", "found": false}, {"type": "without", "string": "Foto: unsplash/Bill Mead", "found": false}, {"type": "without", "string": "Energiewende", "found": false}]}
{"file": "dtb-tennis.de-nominiert.html", "url": "https://www.dtb-tennis.de/Tennis-International/Davis-Cup/News-Features/Davis-Cup-Qualifiers-Kohlmann-nominiert-zwei-Neulinge", "text_len": 5120, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Michael Kohlmann hat die Mannschaft f\u00fcr die Davis Cup-Qualifiers", "found": true}, {"type": "with", "string": "Dass auch Kevin Krawietz und Tim P\u00fctz mit ihrer makellosen", "found": true}, {"type": "with", "string": "Gespielt werden Dreisatz-Matches mit", "found": true}, {"type": "without", "string": "Kohlmann: \u201eAls n\u00e4chstes gewinnen wir den Davis Cup\u201c", "found": false}, {"type": "without", "string": "ZUR\u00dcCK NACH OBEN ", "found": false}, {"type": "without", "string": "DTB nominiert Porsche Nachwuchsteams f\u00fcr 2022", "found": false}]}
{"file": "wind-energie.de.beschleunigung.html", "url": "https://www.wind-energie.de/presse/pressemitteilungen/detail/endlich-mehr-beschleunigung-wagen/", "text_len": 2480, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Innerhalb ihres ersten Jahres hat", "found": false}, {"type": "with", "string": "Eine Erhebung der Fachagentur Windenergie an Land", "found": true}, {"type": "with", "string": "Zu weiteren Komplikationen tr\u00e4gt", "found": true}, {"type": "without", "string": "Ihr Ansprechpartner f\u00fcr Pressefragen", "found": false}, {"type": "without", "string": "Tel.:", "found": false}, {"type": "without", "string": "EUREF-Campus 16", "found": false}]}
{"file": "recyclingmagazin.de.lithium.html", "url": "https://www.recyclingmagazin.de/2022/12/12/europas-erste-lithium-rueckgewinnungsanlage-in-nrw/", "text_len": 970, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Anlage mit einem geplanten", "found": true}, {"type": "with", "string": "Seit etwa 8 Jahren", "found": true}, {"type": "with", "string": "Accurec wird mit der HydroLiC-Technologie", "found": true}, {"type": "without", "string": "TEILEN", "found": false}, {"type": "without", "string": "VERWANDTE ARTIKEL", "found": false}, {"type": "without", "string": "Letzte Meldungen", "found": false}]}
{"file": "nachtkritik.de-Dragqueens.html", "url": "https://nachtkritik.de/kolumnen-georg-kasch/kolumne-queer-royal-ueber-dragqueens-und-dragkings-auf-und-jenseits-der-buehne", "text_len": 6025, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Woher kommt eigentlich der Hass auf Dragqueens?", "found": true}, {"type": "with", "string": "Fr\u00fcher, als Travestiek\u00fcnstler wie Georg Preu\u00dfe", "found": true}, {"type": "with", "string": "und Reiner Kohler noch als Mary und Gordy die B\u00fchnen beherrschten", "found": true}, {"type": "without", "string": "neueste kommentare", "found": false}, {"type": "without", "string": "mehr Kolumnen", "found": false}, {"type": "without", "string": "impressum & kontakt", "found": false}]}
{"file": "t3n.de-Laufzeit.html", "url": "https://t3n.de/news/apple-eigener-iphone-akku-1587177/", "text_len": 3599, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Laut ET-News ziele Apple darauf ab", "found": true}, {"type": "with", "string": "innovative Batterien zu entwickeln, die bisher weltweit noch nicht kommerzialisiert wurden", "found": true}, {"type": "with", "string": "Die Nachfrage nach Hochleistungsbatterien ist mit der Erweiterung", "found": true}, {"type": "without", "string": "Spreading knowledge & future optimism.", "found": false}, {"type": "without", "string": "Verpasse keine News zu Hardware & Gadgets", "found": false}, {"type": "without", "string": "Foldables von Apple? Der Fokus soll derzeit noch woanders liegen", "found": false}]}
{"file": "github.blog.spiceland.html", "url": "https://github.blog/2019-03-29-leader-spotlight-erin-spiceland/", "text_len": 4495, "tp": 4, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "Erin Spiceland is a Software Engineer for SpaceX.", "found": true}, {"type": "with", "string": "make effective plans and goals for the future", "found": true}, {"type": "with", "string": "looking forward to next?", "found": true}, {"type": "with", "string": "Research Consultant at Adelard LLP", "found": true}, {"type": "without", "string": "Related posts", "found": false}, {"type": "without", "string": "Jeremy Epling", "found": false}, {"type": "without", "string": "Missed the main event?", "found": false}, {"type": "without", "string": "Privacy", "found": false}]}
{"file": "murdeltas.wordpress.com.politcamp.html", "url": "https://murdeltas.wordpress.com/2015/04/05/barcamp-graz-2015-politcamp-call-for-action/", "text_len": 2190, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Leute, die in Zukunft das Barcamp", "found": true}, {"type": "with", "string": "Ein Zeichen dieser Ver\u00e4nderung", "found": true}, {"type": "with", "string": "In nicht mehr ganz 2 Wochen", "found": true}, {"type": "without", "string": "Ich bin ein linker Webterrorist", "found": false}, {"type": "without", "string": "Flattr this:", "found": false}, {"type": "without", "string": "Dieses Blog steht unter", "found": false}]}
{"file": "d76cf81a74fa4633bd19d7060f5c05ee.html", "url": "https://www.hessenschau.de/kultur/buchmesse/buecher-autoren/die-minze-als-mutmacher--deniz-yuecels-bericht-aus-dem-tuerkischen-knast,deniz-yuecel-buchmesse-agentterrorist-100.html", "text_len": 3414, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Gef\u00e4ngnis \u2013 im Auftrag der \u00d6ffentlichkeit", "found": true}, {"type": "with", "string": "diese triste Umgebung schlug Deniz Y\u00fccel aufs Gem\u00fct", "found": true}, {"type": "with", "string": "Verfasst mithilfe von Tomatenso\u00dfe und einer Plastikgabel", "found": true}, {"type": "without", "string": "Navigation der Marken des Hessischen Rundfunks", "found": false}, {"type": "without", "string": "Weitere Informationen ", "found": false}, {"type": "without", "string": "Frankfurter Buchmesse 2019", "found": false}]}
{"file": "flawlessfood.co.uk.olive.html", "url": "https://flawlessfood.co.uk/olive-herb-focaccia-bread/", "text_len": 6190, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Oven-baked Italian Olive & Herb Focaccia", "found": true}, {"type": "with", "string": "oil mixture for dipping the focaccia bread into.", "found": false}, {"type": "with", "string": "Carbohydrates: 31g", "found": false}, {"type": "without", "string": "email address will not be published. Required fields", "found": false}, {"type": "without", "string": "We occasionally get sponsored by products, we", "found": false}, {"type": "without", "string": "We publish new recipes weekly, so keep", "found": false}]}
{"file": "spdfraktion.de-Vizepr\u00e4sidentin.html", "url": "https://www.spdfraktion.de/themen/aydan-oezoguz-vizepraesidentin", "text_len": 608, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "ist zur stellvertretenden Pr\u00e4sidentin", "found": false}, {"type": "with", "string": "und arbeitete als wissenschaftliche", "found": true}, {"type": "with", "string": "t\u00fcrkischen Wurzeln am", "found": true}, {"type": "without", "string": "Arbeitsgruppen", "found": false}, {"type": "without", "string": "Bei Fragen und Anregungen", "found": false}, {"type": "without", "string": "Foto: DBT/Stella", "found": false}]}
{"file": "bafa.de-mineraloelabsatz.html", "url": "https://www.bafa.de/SharedDocs/Kurzmeldungen/DE/Energie/Mineraloel/2021_11_mineraloelinfo.html;jsessionid=B01BDCE4530EF0FB9BD52A2652C1F167.2_cid390", "text_len": 1575, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Deutschland im aktuellen Zeitraum", "found": true}, {"type": "with", "string": "32,23", "found": true}, {"type": "with", "string": "die Einfuhr von Roh\u00f6l", "found": true}, {"type": "without", "string": "Mineral\u00f6lstatistik", "found": false}, {"type": "without", "string": "Diese Seite", "found": false}, {"type": "without", "string": "27.01.2022", "found": true}]}
{"file": "correctiv.org.zusage.html", "url": "https://correctiv.org/aktuelles/neue-rechte/2019/05/14/wir-haben-bereits-die-zusage", "text_len": 9636, "tp": 2, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "Vorweg: Die beteiligten AfD-Politiker", "found": true}, {"type": "with", "string": "ist heute Abend um 21 Uhr auch im ZDF-Magazin Frontal", "found": true}, {"type": "without", "string": "Alle Artikel zu unseren Recherchen", "found": false}, {"type": "without", "string": "Wir informieren Sie regelm\u00e4\u00dfig zum Thema Neue Rechte", "found": false}, {"type": "without", "string": "Kommentar verfassen", "found": false}, {"type": "without", "string": "weiterlesen", "found": false}]}
{"file": "proplanta.de.erloesobergrenze.html", "url": "https://www.proplanta.de/agrar-nachrichten/energie/bayern-fordert-hoehere-erloesobergrenzen-fuer-bioenergie_article1670823962.html", "text_len": 3650, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wie der Ressortchef am Dienstag ", "found": true}, {"type": "with", "string": "Unterdessen pochte die Leiterin", "found": true}, {"type": "with", "string": "Derweil w\u00fcrde die vorgeschlagene", "found": true}, {"type": "without", "string": "Weitere Artikel zum Thema", "found": false}, {"type": "without", "string": "Kommentierte Artikel", "found": false}, {"type": "without", "string": "Mehr zum Thema", "found": false}]}
{"file": "24ora.com-internationalschol.html", "url": "https://24ora.com/minister-president-presente-ne-trashion-fashion-show-di-international-school/", "text_len": 1493, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "studiantenan a presenta trahenan traha", "found": true}, {"type": "with", "string": "fatal pa e animalnan. Tambe", "found": true}, {"type": "with", "string": "amor pa nos planeta.", "found": true}, {"type": "without", "string": "MAS FOR DI E AUTOR", "found": false}, {"type": "without", "string": "MINISTERIO DI HUSTICIA NO LO TOLERA NINGUN ACTO", "found": false}, {"type": "without", "string": "AFECTA ARUBA TAMBE", "found": false}]}
{"file": "selbstversorger.de-Huhn.html", "url": "https://www.selbstversorger.de/eier-legen-huehner/", "text_len": 6316, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Mit Sicherheit kennen Sie das Sprichwort: \u201cIch wollt\u2019 ich", "found": true}, {"type": "with", "string": "Ab wann legen H\u00fchner Eier?", "found": true}, {"type": "with", "string": "Die jeweilige H\u00fchnerrasse spielt in Bezug", "found": true}, {"type": "without", "string": "Atme tief durch bevor du Michaela", "found": false}, {"type": "without", "string": "20 Zeichen, dass ein Herzinfarkt", "found": false}, {"type": "without", "string": "Mann schenkt seiner Freundin eine", "found": false}]}
{"file": "bike-magazin.de-strava.html", "url": "https://www.bike-magazin.de/mtb_news/szene_news/strava-update-poi-bei-routen", "text_len": 2289, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Mitte Januar 2022 hat Strava ein", "found": true}, {"type": "with", "string": "Durch die Kombination der Datenbank", "found": true}, {"type": "with", "string": "Unterwegs kann man spontan", "found": true}, {"type": "without", "string": "Ob Supermarkt, Pumptrack oder", "found": true}, {"type": "without", "string": "Lesen Sie das BIKE Magazin", "found": false}, {"type": "without", "string": "Empfehlungen aus der Redaktion", "found": false}]}
{"file": "leichtathletik.de-erfurt.html", "url": "https://www.leichtathletik.de/news/news/detail/76066-erfurt-maximilian-thorwirth-ueberrascht-auf-1500-meter-distanz", "text_len": 5237, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "mit zwei Topzeiten ihre gute Form", "found": true}, {"type": "with", "string": "h\u00e4tte ich mit dieser Zeit nicht gerechnet.", "found": true}, {"type": "with", "string": "Karlsruhe kam Imke Onnen (Hannover 96)", "found": true}, {"type": "without", "string": "Bildergalerie", "found": false}, {"type": "without", "string": "WEITERE NEWS", "found": false}, {"type": "without", "string": "Trauer um Henning von Papen", "found": false}]}
{"file": "bundeskanzleramt.gv.at-bundesminsterin.html", "url": "https://www.bundeskanzleramt.gv.at/bundeskanzleramt/nachrichten-der-bundesregierung/2022/02/bundesministerin-raab-mit-Laendern-und-unternehmen-frauen-und-familienfreundliche-rahmenbedingungen-gestalten.html", "text_len": 3559, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "damit M\u00fctter selbstverst\u00e4ndlich", "found": true}, {"type": "with", "string": "bei der Vereinbarkeit von Beruf", "found": true}, {"type": "with", "string": "\"dass wir einen gro\u00dfen Gap bei den", "found": true}, {"type": "without", "string": "Nachrichten", "found": false}, {"type": "without", "string": "Datenschutzinformation", "found": false}, {"type": "without", "string": "Direkt zu", "found": false}]}
{"file": "Angus Barbieri. Nie jad\u0142 przez 382 dni - Menway w INTERIA.PL.html", "url": "https://menway.interia.pl/historia/news-angus-barbieri-nie-jadl-przez-382-dni,nId,5222535", "text_len": 2849, "tp": 4, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Angus pochodzi\u0142 ze", "found": true}, {"type": "with", "string": "nie d\u0142u\u017cszy ni\u017c 40 dni.", "found": true}, {"type": "with", "string": "Pocz\u0105tkowo Barbieri znajdowa\u0142", "found": true}, {"type": "with", "string": "cukru oraz mleka.", "found": true}, {"type": "without", "string": "domena publiczna", "found": false}, {"type": "without", "string": "Opuszczony Dom", "found": false}, {"type": "without", "string": " Poniedzia\u0142ek", "found": false}]}
{"file": "fisch-hitparade.de-alkohhol.html", "url": "https://www.fisch-hitparade.de/magazine/alkohol-auf-dem-boot/", "text_len": 5400, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "sodass man dazu geneigt ist,", "found": true}, {"type": "with", "string": "und der F\u00fchrer des Wasserfahrzeugs", "found": true}, {"type": "with", "string": "zwischen 0,5 und 1,09 werden als Ordnungswidrigkeiten", "found": true}, {"type": "without", "string": "Alkohol beim Angeln \u2013 Diskussion im Forum", "found": false}, {"type": "without", "string": "Jetzt teilen!", "found": false}, {"type": "without", "string": "Video: Achtung Kontrolle", "found": false}]}
{"file": "hvw-online.org-zuschauer.html", "url": "https://www.hvw-online.org/aktuell/detail/news/zuschauerrueckkehr-bei-den-proficlubs-der-region", "text_len": 1747, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Heimspiele keine Tickets zu erwerben.", "found": true}, {"type": "with", "string": "G\u00f6ppingen und den TVB Stuttgart geht", "found": true}, {"type": "with", "string": "Beachtung der 2G+-Regelung", "found": true}, {"type": "without", "string": "Schriftgr\u00f6\u00dfe", "found": false}, {"type": "without", "string": "Impressum", "found": false}, {"type": "without", "string": "Fritz-Walter-Weg", "found": false}]}
{"file": "minusl.de.joghurt.html", "url": "https://www.minusl.de/produkt_kategorien/joghurt/", "text_len": 2028, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "wohl, denn MinusL bringt Genuss in mein Leben.", "found": true}, {"type": "with", "string": "generell die Zutatenliste einer Verpackung beachten. Allergene Zutaten ", "found": true}, {"type": "with", "string": "Sie lieben Joghurt mit frischen Fr\u00fcchten un", "found": true}, {"type": "without", "string": "Senden", "found": false}, {"type": "without", "string": "ZUR\u00dcCK", "found": false}, {"type": "without", "string": "MinusL Athentikos", "found": false}]}
{"file": "st-georg.de-olympia.html", "url": "https://www.st-georg.de/news/mehr-sport/pferdesport-definitiv-bei-olympia-2028-dabei/", "text_len": 1239, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Dezember kam die Meldung, dass Reiten", "found": true}, {"type": "with", "string": "Sportarten dort zu sehen sein werden. Reiten ist", "found": true}, {"type": "with", "string": "f\u00fcr die Umwelt und die Frage, ob der Sport", "found": true}, {"type": "without", "string": "Tsch\u00fcss, Bauchfett!", "found": false}, {"type": "without", "string": "(FEI/Christophe Taniere)", "found": false}, {"type": "without", "string": "OLYMPISCHE SPIELE", "found": false}]}
{"file": "sonntag-sachsen.de.emanuel.html", "url": "https://www.sonntag-sachsen.de/emanuel-scobel-wird-thomanerchor-geschaeftsfuehrer", "text_len": 2005, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Neuer Gesch\u00e4ftsf\u00fchrender Leiter", "found": true}, {"type": "with", "string": "nach Leipzig wechseln.", "found": true}, {"type": "without", "string": "Mehr zum Thema", "found": false}, {"type": "without", "string": "Folgen Sie uns auf Facebook und Twitter", "found": false}, {"type": "without", "string": "Aktuelle Ausgabe", "found": false}]}
{"file": "faz.net.streaming.html", "url": "https://www.faz.net/aktuell/wirtschaft/nutzerbasierte-abrechnung-musik-stars-fordern-neues-streaming-modell-16604622.html", "text_len": 3823, "tp": 2, "fn": 1, "fp": 1, "tn": 3, "details": [{"type": "with", "string": "\u201eDie Liste der K\u00fcnstler", "found": true}, {"type": "with", "string": "nicht blo\u00df um h\u00f6here Eink\u00fcnfte", "found": true}, {"type": "with", "string": "Der Wandel der Musikbranche", "found": false}, {"type": "without", "string": "Etwa 100 deutsche Reisende", "found": false}, {"type": "without", "string": "Abonnieren Sie unsere", "found": false}, {"type": "without", "string": "Joe Kaeser deutet vage", "found": false}, {"type": "without", "string": "Redakteur in der Wirtschaft.", "found": true}]}
{"file": "eltiempo.com-candidatos.html", "url": "https://www.eltiempo.com/colombia/medellin/elecciones-2022-candidatos-presidenciales-en-la-universidad-eafit-669594", "text_len": 4801, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "enmarcado en 6 ejes tem\u00e1ticos relacionados", "found": true}, {"type": "with", "string": "que se llama Neobanco con un bill\u00f3n", "found": true}, {"type": "with", "string": "colectivamente, de acabar con este sistema", "found": true}, {"type": "without", "string": "Necesitamos una renovaci\u00f3n", "found": false}, {"type": "without", "string": "llen\u00f3 de empresas de webcam", "found": true}, {"type": "without", "string": "noticias para ti", "found": false}]}
{"file": "de.creativecommons.org.endlich.html", "url": "https://de.creativecommons.org/index.php/2014/03/20/endlich-wird-es-spannend-die-nc-einschraenkung-nach-deutschem-recht/", "text_len": 1280, "tp": 1, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "das letzte Wort sein kann.", "found": true}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}, {"type": "without", "string": "OERde14", "found": false}, {"type": "without", "string": "Michael Blahm", "found": true}]}
{"file": "modepilot.de.duschkopf.html", "url": "https://www.modepilot.de/2019/05/21/geht-euch-auch-so-oder-auf-reisen-nie-ohne-meinen-duschkopf/", "text_len": 5250, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Allerdings sieht es wie ein Dildo aus,", "found": true}, {"type": "with", "string": "gibt Bescheid, ne?", "found": true}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}, {"type": "without", "string": "Deine E-Mail (bleibt nat\u00fcrlich unter uns)", "found": false}]}
{"file": "deutscheweine.de-riesling.html", "url": "https://www.deutscheweine.de/aktuelles/meldungen/details/news/detail/News/rieslingbirthday-posts-gewinnen/", "text_len": 1936, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Es gibt zahlreiche \"erste\" Erw\u00e4hnungen", "found": true}, {"type": "with", "string": "zeigen die Verwandtschaft mit Wildreben", "found": true}, {"type": "with", "string": "Instagram-Posts mit dem hashtag", "found": true}, {"type": "without", "string": "MELDUNGEN AUS DEM DWI", "found": false}, {"type": "without", "string": "Downloadbereich", "found": false}, {"type": "without", "string": "UNSERE APP DEUTSCHE WEINE IM APPSTORE", "found": false}]}
{"file": "bsi.de-ki.html", "url": "https://www.bsi.bund.de/DE/Service-Navi/Presse/Pressemitteilungen/Presse2022/220128_Forschungsprojek-KI-Auto_BSI-ZF.html", "text_len": 3436, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "orteile von KI-Systemen in der Mobilit\u00e4t", "found": true}, {"type": "with", "string": "Anforderungen, Methoden und Werkzeuge", "found": true}, {"type": "with", "string": "KI-Systemen in Autos nach allgemein", "found": true}, {"type": "without", "string": "Verbraucherinnen und Verbraucher", "found": false}, {"type": "without", "string": "IT-SICHERHEITSVORFALL", "found": false}, {"type": "without", "string": "FOLGEN SIE UNS", "found": false}]}
{"file": "iwr.de.IWRpressedienst.Nordex.html", "url": "https://www.iwrpressedienst.de/energie-themen/pm-7663-iwes-und-nordex-group-intensivieren-zusammenarbeit-bei-netzintegration-von-windenergieanlagen", "text_len": 8219, "tp": 3, "fn": 0, "fp": 3, "tn": 0, "details": [{"type": "with", "string": "Gemeinsam entwickelter Versuchsstand", "found": true}, {"type": "with", "string": "Michael Franke, Vice President", "found": true}, {"type": "with", "string": "Die Nordex Group im Profil", "found": true}, {"type": "without", "string": "Telefon:", "found": true}, {"type": "without", "string": "Online-Pressemappe", "found": true}, {"type": "without", "string": "- alle Pressemitteilungen der", "found": true}]}
{"file": "7mind.de.grenzen.html", "url": "https://www.7mind.de/magazin/so-lernen-wir-grenzen-zu-setzen", "text_len": 9733, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Sie sind das Fundament der", "found": true}, {"type": "with", "string": "So erkennst du", "found": true}, {"type": "with", "string": "\u00dcbung, \u00dcbung, \u00dcbung", "found": true}, {"type": "without", "string": "Das k\u00f6nnte dich auch interessieren", "found": false}, {"type": "without", "string": "Unsere Inhalte", "found": false}, {"type": "without", "string": "Einloggen", "found": false}]}
{"file": "management-circle.de.glasses.html", "url": "https://www.management-circle.de/blog/remote-support-mit-smart-glasses/", "text_len": 4988, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wie Sie sehen bietet der Remote Support mit Smart Glasses", "found": true}, {"type": "with", "string": "Die Arbeit der Mitarbeiter im Karosseriebau vor Ort wird durch Smart Glasses", "found": true}, {"type": "with", "string": "In der Industrie wird der Remote Support mit Smart Glasses immer beliebter", "found": true}, {"type": "without", "string": "Als Content Marketing Managerin betreue ich", "found": false}, {"type": "without", "string": "Diese neuen Entwicklungen sollten Sie kennen", "found": false}, {"type": "without", "string": "In unserem Seminar \u201eAugmented Reality\u201c erarbeiten Sie anhand verschiedener Experience", "found": false}]}
{"file": "kochbar.de.schneiden.html", "url": "https://www.kochbar.de/tipp/1918/Tomaten-richtig-schneiden.html", "text_len": 1613, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ihr kennt es sicher auch!", "found": true}, {"type": "with", "string": "aber ohne Strunk sieht es auch sch\u00f6ner aus.", "found": true}, {"type": "with", "string": "haften am Fruchtfleisch und und k\u00f6nnen nicht", "found": true}, {"type": "without", "string": "Tipp favorisieren", "found": false}, {"type": "without", "string": "Um den Tipp \"Tomaten richtig schneiden\" kommentieren", "found": false}, {"type": "without", "string": "Die besten TIPPS", "found": false}]}
{"file": "bund.net-hermlin.html", "url": "https://www.bund.net/bund-tipps/detail-tipps/tip/unser-tipp-im-november-das-hermelin/", "text_len": 3249, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Beobachtungstipp", "found": true}, {"type": "with", "string": "Paarungszeit der Hermeline", "found": true}, {"type": "with", "string": "Hermelin ist weit verbreitet", "found": true}, {"type": "without", "string": "Newsletter erhalten", "found": false}, {"type": "without", "string": "iStock.com", "found": false}, {"type": "without", "string": "Unser Tipp im Oktober:", "found": false}]}
{"file": "uebermedien.de-Israel.html", "url": "https://uebermedien.de/89676/gute-tabus-schlechte-tabus-die-vertauschten-rollen-in-der-debatte-ueber-israel/", "text_len": 2984, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Was folgt aus diesen Beobachtungen?", "found": false}, {"type": "with", "string": "Nat\u00fcrlich k\u00f6nnte man sich w\u00fcnschen", "found": false}, {"type": "with", "string": "dass es Verst\u00e4ndnis f\u00fcr das Gegen\u00fcber weckt", "found": false}, {"type": "without", "string": "Aus Solidarit\u00e4t mit Israel verzichtet \u201eBild\u201c darauf", "found": false}, {"type": "without", "string": "\u00fcber pal\u00e4stinensische Opfer in Gaza zu berichten", "found": false}, {"type": "without", "string": "Die Magie der Zuschauer-Call-ins", "found": false}]}
{"file": "internet-law.de.pseudonymen.html", "url": "http://www.internet-law.de/2011/07/verstost-der-ausschluss-von-pseudonymen-bei-google-gegen-deutsches-recht.html", "text_len": 2203, "tp": 1, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wann Blogs einer Impressumspflicht unterliegen,", "found": true}, {"type": "without", "string": "\u00dcber mich", "found": false}, {"type": "without", "string": "Gesetzes- und Rechtsprechungszitate werden automatisch", "found": false}, {"type": "without", "string": "Comment by", "found": false}]}
{"file": "pix-bavaria.de.html", "url": "https://www.pix-bavaria.de/", "text_len": 778, "tp": 0, "fn": 3, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Alle Fotos sind in Aufl\u00f6sungen", "found": false}, {"type": "with", "string": "in der Web-Galerie von", "found": false}, {"type": "with", "string": "Jede andere Art der Bildnutzung", "found": false}, {"type": "without", "string": "Erstellt mit Piwigo", "found": false}, {"type": "without", "string": "Kontakt zu pix-bavaria", "found": false}]}
{"file": "von-der-see.de.design.html", "url": "https://von-der-see.de/design/", "text_len": 2177, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ein professionelles und seri\u00f6s", "found": true}, {"type": "with", "string": "Design geht aber auch weit", "found": true}, {"type": "with", "string": "zahlreiche Bereiche zuverl\u00e4ssig ab", "found": true}, {"type": "without", "string": "Wenn Sie uns per Kontaktformular Anfragen", "found": false}, {"type": "without", "string": "Der Upstalsboom-Weg", "found": false}, {"type": "without", "string": "Interessantes aus unserem", "found": false}]}
{"file": "haenselblatt.com.chinese.html", "url": "https://www.haenselblatt.com/chinese-money-plant-info", "text_len": 2311, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Was ist eine chinesische Geldanlage?", "found": true}, {"type": "with", "string": "Pilea Pflanzenpflege ist relativ minimal", "found": true}, {"type": "with", "string": "Langsam zu vermehren und erst", "found": true}, {"type": "without", "string": "Spinat kann mit einer Reihe von Krankheiten, vor allem", "found": false}, {"type": "without", "string": "Ich bin ein billiger G\u00e4rtner.", "found": false}, {"type": "without", "string": "Haben Sie schon einmal dar\u00fcber nachgedacht", "found": false}]}
{"file": "rtl.de-lockdown.html", "url": "https://www.rtl.de/cms/bericht-bund-und-laender-wollen-lockdown-verlaengern-um-weitere-vier-wochen-4723862.html ", "text_len": 3158, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "bringt die ganze Impfstrategie", "found": true}, {"type": "with", "string": "Wie der \"Business Insider\" unter", "found": true}, {"type": "with", "string": "TVNOW-DOKU: Das Impfdilemma", "found": true}, {"type": "without", "string": "Stefan Boness", "found": false}, {"type": "without", "string": "Zahlen explodieren - Politik pennt?!", "found": false}, {"type": "without", "string": "Wohnen & Haushalt Gutscheine", "found": false}]}
{"file": "ditb.de-Propheten.html", "url": "https://ditib.de/detail1.php?id=765&lang=de", "text_len": 3098, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Mit seinen durch die Schw\u00fcre", "found": true}, {"type": "with", "string": "S\u00fcden und vom Osten", "found": true}, {"type": "with", "string": "Knappheit, sowie in Zeiten", "found": true}, {"type": "without", "string": "Nachrichten und Pressemeldungen", "found": false}, {"type": "without", "string": "Botschaft", "found": true}, {"type": "without", "string": "Twittern", "found": false}]}
{"file": "wir-empfehlen.info.3289.html", "url": "http://wir-empfehlen.info/?p=3289", "text_len": 407, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Seit Anfang 2019 stehen wir", "found": true}, {"type": "with", "string": "Ottostra\u00dfe 14", "found": true}, {"type": "with", "string": " F\u00fcr Spezialfahrzeuge (incl. Viehtransportern)", "found": true}, {"type": "without", "string": "Deine E-Mail-Adresse wird", "found": false}, {"type": "without", "string": "Sei der Erste dem dies gef\u00e4llt.", "found": false}, {"type": "without", "string": "Top Kunden Bewertungen", "found": false}]}
{"file": "creativecommons.org.html", "url": "https://creativecommons.org/about/", "text_len": 1436, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "With a network of", "found": true}, {"type": "with", "string": "Our work is to build", "found": true}, {"type": "with", "string": "Our work spans a variety", "found": true}, {"type": "without", "string": "Connect with Creative Commons", "found": false}, {"type": "without", "string": "Honoring Our Friend", "found": false}, {"type": "without", "string": "In this section", "found": false}]}
{"file": "handwerk-magazin.de-Angriffe.html", "url": "https://www.handwerk-magazin.de/cyber-angriffe-20-prozent-vom-it-budget-in-die-it-sicherheit-stecken-250901/", "text_len": 4606, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Erpressungsmethoden wie Ransomeware fest.\u201c", "found": true}, {"type": "with", "string": "gesichtet, das sind durchschnittlich", "found": true}, {"type": "with", "string": "weshalb das Update noch nicht umgesetzt wurde", "found": true}, {"type": "without", "string": "Steuern Sie Ihren Kundendienst", "found": false}, {"type": "without", "string": "Mission Mittelstand - digitales", "found": false}, {"type": "without", "string": "Cyber-Attacken nehmen weiter zu.", "found": false}]}
{"file": "goodnight.at.konzert.html", "url": "https://goodnight.at/magazin/kultur/3017-konzert-highlights-im-november-2022", "text_len": 4561, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Mit dem im August 2022", "found": true}, {"type": "with", "string": "Seit 2012 bringen Kraftklub", "found": true}, {"type": "with", "string": "Ein bisschen Old-School Hip-Hop,", "found": true}, {"type": "without", "string": "Beliebteste Artikel", "found": false}, {"type": "without", "string": "Facebook", "found": false}, {"type": "without", "string": "Mediadaten", "found": false}]}
{"file": "iconmagazine.de.sharonstone.html", "url": "https://iconmagazine.de/story/interview-mit-sharon-stone/", "text_len": 3886, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Es gibt Ereignisse, die", "found": false}, {"type": "with", "string": "In welchem seelischen Zustand", "found": false}, {"type": "with", "string": "Ich war zehn Jahre lang", "found": false}, {"type": "without", "string": "INTERVIEW SVEN MICHAELSEN", "found": false}, {"type": "without", "string": "Kontakt", "found": false}, {"type": "without", "string": "Impressum", "found": false}]}
{"file": "0afd671fc2b64f3caa83a91537e8d343.html", "url": "https://telebasel.ch/2019/10/19/junge-lenker-schrotten-corvette-und-audi-in-einer-nacht/?channel=105100", "text_len": 1444, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In der Nacht auf Samstag haben zwei junge Lenker", "found": false}, {"type": "with", "string": "Ein Neulenker ist in der Nacht auf Samstag um 23:50", "found": true}, {"type": "with", "string": "Schweizer schrottet Corvette", "found": true}, {"type": "without", "string": "1 Kommentar", "found": false}, {"type": "without", "string": "Mehr aus dem Channel", "found": false}, {"type": "without", "string": "Fruchtiger Pinot Grigio zu Saiblingsfilet mit Buttermilch-Dashi", "found": false}]}
{"file": "tennisnet.com-ueberraschungen.html", "url": "https://www.tennisnet.com/news/diese-ymers-zwei-ueberraschungen-an-einem-tag", "text_len": 2152, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Montpellier f\u00fcr zwei \u00dcberraschungen gesorgt", "found": true}, {"type": "with", "string": "Drei-Kronen-Team wieder einmal Gespr\u00e4chsthema", "found": true}, {"type": "with", "string": "Mann am Start, der nach seinem fr\u00fchen", "found": true}, {"type": "without", "string": "Hier das Einzel-Tableau in Pune", "found": true}, {"type": "without", "string": "ATP: Aufschlag-H\u00fcne Milos Raonic f\u00e4llt", "found": false}, {"type": "without", "string": "Berlin: GEERS sucht 700", "found": false}]}
{"file": "decohome.de.magenta.html", "url": "https://www.decohome.de/farbe-des-jahres-2023-viva-magenta/", "text_len": 2423, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Als \u201eFaust im Samthandschuh\u201c ", "found": true}, {"type": "with", "string": "Pulsierend, mutig, fr\u00f6hlich,", "found": true}, {"type": "with", "string": "Ob nun als Akzent oder All-over Look", "found": true}, {"type": "without", "string": " Wie finde ich das richtige M\u00f6bel?", "found": false}, {"type": "without", "string": "Marsala, Terrakotta, Ochsenblut, Curry und Co", "found": false}, {"type": "without", "string": "Hat das Sammel-Gen von ihrem Opa geerbt", "found": false}]}
{"file": "kyffhaeuser-nachrichten.de-Regen.html", "url": "https://kyffhaeuser-nachrichten.de/news/news_lang.php?ArtNr=335614", "text_len": 6435, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Statt herk\u00f6mmlichem Herbstwetter brachte", "found": true}, {"type": "with", "string": "der Oktober 2023 sehr viel Regen und eine \u00e4u\u00dferst milde Witterung mit sommerlichen Nuancen", "found": true}, {"type": "with", "string": "Die Vegetation kleidete sich nur z\u00f6gerlich herbstlich", "found": true}, {"type": "without", "string": "Am meisten gelesen...", "found": false}, {"type": "without", "string": "Letzte Kommentare", "found": false}, {"type": "without", "string": "NACHRICHTEN AUS DEM KYFFH\u00c4USERKREIS - REGIONAL, SCHNELL, KOSTENLOS, SUPER DIGITAL", "found": false}]}
{"file": "www1.wdr.de-Correctiv-Recherche.html", "url": "https://www1.wdr.de/nachrichten/correctiv-recherche-deutsche-waffen-fuer-russland-100.html", "text_len": 1499, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Hersteller d\u00fcrfen sie demnach ins Ausland verkaufen", "found": true}, {"type": "with", "string": "weil sie offiziell als Jagd- oder Sportwaffen gelten", "found": true}, {"type": "with", "string": "und deshalb nicht unter das Kriegswaffen-Kontrollgesetz fallen", "found": true}, {"type": "without", "string": "WDR aktuell Whatsapp-Kanal abonnieren - so geht's", "found": false}, {"type": "without", "string": "App-Symbol: WDR aktuellDie App WDR aktuell begleitet Sie durch den Tag", "found": false}, {"type": "without", "string": "Wie wir mit Gendern umgehen", "found": false}]}
{"file": "nalas-loewenseiten.info.m.html", "url": "http://www.nalas-loewenseiten.info/loewen-lexikon/?letter=M", "text_len": 5385, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Nur die L\u00f6wenm\u00e4nnchen haben eine", "found": true}, {"type": "with", "string": "Aber es gibt eben nicht nur diese tollen Schnuckll\u00f6wen", "found": true}, {"type": "with", "string": "Und nicht nur dass, wie Peyton West", "found": true}, {"type": "without", "string": "Nala L\u00f6wenk\u00f6nigin", "found": false}, {"type": "without", "string": "Prankentausch", "found": false}, {"type": "without", "string": "Lexikon", "found": false}]}
{"file": "archive.peptalks.de.schulnoten.html", "url": "https://web.archive.org/web/20131110121040/http://www.peptalks.de/haben-sich-mozarts-eltern-wegen-seiner-schulnoten-gesorgt/", "text_len": 9093, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Was meinen Sie", "found": true}, {"type": "with", "string": "Anfang 1762 nach M\u00fcnchen und anschlie\u00dfend", "found": true}, {"type": "with", "string": "Er lebte still und unscheinbar", "found": true}, {"type": "without", "string": "Dichter und Denker zu Schule und Bildung", "found": false}, {"type": "without", "string": "Sie m\u00f6chten gerne automatisch \u00fcber jeden", "found": false}, {"type": "without", "string": "Trage deine Daten unten ein", "found": false}]}
{"file": "furche.at.achtsam.html", "url": "https://www.furche.at/gesellschaft/achtsam-durch-die-krise-2497954", "text_len": 6759, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "gen gen\u00e4hrt wird. Und lebensbedrohlich ist es \u2013 jedenfalls statistisch gesehen, und da die Statistik nichts dar\u00fcb", "found": true}, {"type": "with", "string": "n, verwechseln Achtsamkeit mit Aufmerksamkeit.", "found": true}, {"type": "with", "string": "Achtsamkeit zu \u00fcben, kann man im", "found": true}, {"type": "without", "string": "Im FURCHE-Navigator weiterlesen", "found": false}, {"type": "without", "string": "FURCHE-Newsletter", "found": false}, {"type": "without", "string": "itreisen und neue Perspektiven", "found": false}]}
{"file": "harpers.org.justice.html", "url": "https://harpers.org/a-letter-on-justice-and-open-debate/", "text_len": 8018, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Our cultural institutions are facing a moment of trial", "found": true}, {"type": "with", "string": "expect the public or the state to defend it for us.", "found": true}, {"type": "with", "string": "The free exchange of information and ideas, the", "found": true}, {"type": "without", "string": "Do Not Sell My Personal Information", "found": false}, {"type": "without", "string": "Privacy Policy ", "found": false}, {"type": "without", "string": "Customer Care", "found": false}]}
{"file": "autozeitung.de-adblue.html", "url": "https://www.autozeitung.de/adblue-diesel-tanken-ratgeber-180301.html", "text_len": 7562, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Tankstellen: Wo kann man Adblue kaufen?", "found": true}, {"type": "with", "string": "AdBlue-Tank einfrieren?", "found": true}, {"type": "with", "string": "Diesel d\u00fcrfen seitdem statt", "found": true}, {"type": "without", "string": "Beliebte Marken", "found": false}, {"type": "without", "string": "So kommt die", "found": false}, {"type": "without", "string": "Hefte testen und 35", "found": false}]}
{"file": "gitarrebass.de-dieneue.html", "url": "https://www.gitarrebass.de/dm-native-advert/gitarre-bass-02-2022/", "text_len": 11029, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Und hat einen neuen Signature-Amp", "found": true}, {"type": "with", "string": "hat sich Matthias Mineur mit ihm", "found": true}, {"type": "with", "string": "Vintage-Fender-Telecaster,", "found": true}, {"type": "without", "string": "Alles Gute zum neuen Jahr", "found": true}, {"type": "without", "string": "Schreibe einen Kommentar", "found": false}, {"type": "without", "string": "AKTUELLE AUSGABE", "found": false}]}
{"file": "tell-review.de.heimweh.html", "url": "https://tell-review.de/unstillbares-heimweh/", "text_len": 10027, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In seinem Essay \u201eLob der Melancholie\u201c", "found": false}, {"type": "with", "string": "Schon in seiner ersten Studie Melancholie", "found": true}, {"type": "with", "string": "in immer wiederkehrender Bezugspunkt", "found": true}, {"type": "without", "string": "Gef\u00e4llt Ihnen, was Sie sehen?", "found": false}, {"type": "without", "string": "Benachrichtige mich \u00fcber nachfolgende", "found": false}, {"type": "without", "string": "Freier Autor in Berlin", "found": false}]}
{"file": "creativecommons.at.faircoin.html", "url": "https://www.creativecommons.at/faircoin-hackathon", "text_len": 1556, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wir waren massgeblich", "found": true}, {"type": "with", "string": "link is external", "found": true}, {"type": "without", "string": "Publikationen in Forschung", "found": false}, {"type": "without", "string": "Vorheriges", "found": false}, {"type": "without", "string": "Nach fast zwei Jahren Arbeit", "found": false}]}
{"file": "Volksstimme.ch-loehne.html", "url": "https://www.volksstimme.ch/gute-loehne-alleine-reichen-nicht", "text_len": 342, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Das Zentrum Ergolz lud zur Gespr\u00e4chsrunde ein", "found": true}, {"type": "with", "string": "Die Teilnehmenden sprachen dar\u00fcber", "found": true}, {"type": "with", "string": "wie Arbeitgeber in Zeiten des Fachkr\u00e4ftemangels gen\u00fcgend Personal finden", "found": true}, {"type": "without", "string": "M\u00f6chten Sie weiterlesen?", "found": false}, {"type": "without", "string": "Ja. Ich bin Abonnent.", "found": false}, {"type": "without", "string": "Ja. Ich ben\u00f6tige ein Abo.", "found": false}]}
{"file": "zfk.de.waermepumpen.html", "url": "https://www.zfk.de/energie/waerme/waermepumpenmarkt-waechst-um-42-prozent-gegenueber-dem-vorjahr", "text_len": 1449, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "W\u00e4rmepumpen boomen", "found": false}, {"type": "with", "string": "Trotz schwieriger", "found": true}, {"type": "with", "string": "Gas r\u00fcckl\u00e4ufig", "found": true}, {"type": "without", "string": "Mehr zum Thema", "found": false}, {"type": "without", "string": "ZfK.de > Energie > W\u00e4rme", "found": false}, {"type": "without", "string": "AGB Impressum Datenschutz", "found": false}]}
{"file": "medicalnewstoday.com.318674.html", "url": "https://www.medicalnewstoday.com/articles/318674", "text_len": 5476, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Many of us have noticed that we seem to get our", "found": true}, {"type": "with", "string": "But the exact moment at which information becomes", "found": true}, {"type": "with", "string": " that the brain goes through to complete a", "found": true}, {"type": "without", "string": "myths, and reveal tips for improving brain functioning.", "found": false}, {"type": "without", "string": "to such placement, do not provide the information.", "found": false}, {"type": "without", "string": "\u00a9 2004-2020 Healthline Media UK Ltd, Brighton", "found": false}]}
{"file": "wmn.de.krankheit.html", "url": "https://www.wmn.de/health/body-fitness/staendig-muede-an-diesen-krankheiten-koennte-es-liegen-id459844", "text_len": 3974, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Leidest du an st\u00e4ndiger M\u00fcdigkeit", "found": false}, {"type": "with", "string": "St\u00e4ndige M\u00fcdigkeit kann belastend sein", "found": true}, {"type": "with", "string": "um eine Diagnose zu bekommen,", "found": false}, {"type": "without", "string": "Markiert:", "found": false}, {"type": "without", "string": "Kontakt", "found": false}, {"type": "without", "string": "BODY & FITNESS", "found": false}]}
{"file": "zooroyal.de.trixie.html", "url": "https://www.zooroyal.de/trixie-natura-kleintierstall-mit-freilaufgehege", "text_len": 2370, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "stabilem Kiefernholz gefertigt mit herausziehbarem, kunststoffbeschichtetem Boden.", "found": false}, {"type": "with", "string": "Der Natura Stall l\u00e4sst sich von oben sowie von vorne \u00f6ffnen ", "found": true}, {"type": "with", "string": "verschlie\u00dfbare Bodenluke mit Kunststoffbeschichtung", "found": true}, {"type": "without", "string": "Kleintierheim", "found": false}, {"type": "without", "string": "dass ZooRoyal mir per E-Mail an mich gerichtete Werbung", "found": false}, {"type": "without", "string": "Trixie Kleintierfutter", "found": false}]}
{"file": "foren.myoos.de.html", "url": "https://foren.myoos.de/viewtopic.php?f=4&t=167&sid=58428beaa14598c2e02d93ad5c773e4d", "text_len": 3724, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Freie Software ist Software, die ohne Ansicht der Person", "found": true}, {"type": "with", "string": "http://www.gnu.org/philosophy/free-sw.de.html", "found": true}, {"type": "with", "string": "Software (OSS) ein und entwickeln einen Praxisleitfaden.", "found": true}, {"type": "without", "string": "Forum Software", "found": false}, {"type": "without", "string": "Alle Zeiten sind UTC+02:00", "found": false}, {"type": "without", "string": "Mitglieder in diesem Forum:", "found": false}]}
{"file": "youhadmeatgardening.com.lemon.html", "url": "https://youhadmeatgardening.com/lemon-tree-from-seed", "text_len": 18111, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Now you know how to grow lemon trees", "found": true}, {"type": "with", "string": "for planting lemon seeds has a pH between", "found": true}, {"type": "with", "string": "Place the seeds about one inch apart on a paper", "found": true}, {"type": "without", "string": "Your email address will not be published", "found": false}, {"type": "without", "string": "We can help you grow the indoor", "found": false}, {"type": "without", "string": "apartment gardening. Learn how to stop killing", "found": false}]}
{"file": "taucher.net-tauchmesse.html", "url": "https://taucher.net/diveinside-boot_tulln_2022_abgesagt-kaz8693", "text_len": 1678, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Wassersportler in \u00d6sterreich und", "found": true}, {"type": "with", "string": "Optimismus und damit die Vorfreude", "found": true}, {"type": "with", "string": "Sobald weitere Informationen vorliegen", "found": true}, {"type": "without", "string": "Letzte Artikel", "found": false}, {"type": "without", "string": "Norwegen: Orcas und Buckelwale auf Jagd", "found": false}, {"type": "without", "string": "Kategorie: News", "found": true}]}
{"file": "reset.org.clickbait.html", "url": "https://reset.org/du-wirst-nicht-glauben-wie-viel-co2-clickbait-websites-produzieren/", "text_len": 5208, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Schlagzeilen wie die dieses Artikels", "found": true}, {"type": "with", "string": "Die Studie von Ebiquity und Scope3 legt", "found": true}, {"type": "with", "string": "Im Gegensatz dazu lag der CO2PM f\u00fcr", "found": true}, {"type": "without", "string": "MARKIERT MIT", "found": false}, {"type": "without", "string": "DAS K\u00d6NNTE DICH AUCH INTERESSIEREN", "found": false}, {"type": "without", "string": "MEIST GELESEN", "found": false}]}
{"file": "lanacion.com.ar-jugada.html", "url": "https://www.lanacion.com.ar/politica/jugada-del-oficialismo-para-evitar-que-jxc-avance-con-la-boleta-unica-en-diputados-nid03052022/", "text_len": 5066, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "elecciones nacionales. Lo hizo por medio", "found": true}, {"type": "with", "string": "la infecci\u00f3n por el", "found": true}, {"type": "with", "string": "funci\u00f3n de esta comisi\u00f3n no es tratar la ley", "found": true}, {"type": "without", "string": "una causa por cohecho", "found": false}, {"type": "without", "string": "a una sesi\u00f3n para", "found": true}, {"type": "without", "string": "Sergio Massa, el presidente", "found": false}]}
{"file": "campograndenews.com.br-adolescente.html", "url": "https://www.campograndenews.com.br/cidades/interior/adolescente-encontrada-morta-em-vala-estava-gravida-de-3-meses-confirma-irma", "text_len": 2066, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "intrigante. Conforme a irm\u00e3", "found": true}, {"type": "with", "string": "no momento em que a menina teria", "found": true}, {"type": "with", "string": "Luana na mesma noite do", "found": true}, {"type": "without", "string": "VEJA TAMB\u00c9M", "found": false}, {"type": "without", "string": "Adolescente morta na", "found": false}, {"type": "without", "string": "Nos siga no", "found": false}]}
{"file": "Nowa Zelandia_ p\u0142atny urlop dla rodzic\u00f3w poronionego dziecka. Jak to wygl\u0105da w Polsce_ - Klub Jagiello\u0144ski.html", "url": "https://klubjagiellonski.pl/2021/04/22/nowa-zelandia-platny-urlop-dla-rodzicow-poronionego-dziecka-jak-to-wyglada-w-polsce/", "text_len": 3785, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Trzy dni", "found": true}, {"type": "with", "string": "w \u017cycie w kwietniu.", "found": true}, {"type": "with", "string": "Ustawa Holidays", "found": true}, {"type": "without", "string": "korzystamy z cookies.", "found": false}, {"type": "without", "string": "Czytasz w\u0142a\u015bnie nowy", "found": true}, {"type": "without", "string": "Tw\u00f3j email", "found": false}]}
{"file": "topagrar.com.schnee.solat.html", "url": "https://www.topagrar.com/energie/news/schnee-belastet-module-10558804.html", "text_len": 2342, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Eine Schneedecke auf der", "found": true}, {"type": "with", "string": "Das Gewicht belastet", "found": true}, {"type": "with", "string": "Verschiedene Experten warnen ", "found": true}, {"type": "without", "string": "DIE REDAKTION EMPFIEHLT", "found": false}, {"type": "without", "string": "Meistgelesene Artikel", "found": false}, {"type": "without", "string": "Meistdiskutierte Artikel", "found": false}]}
{"file": "love-hina.ch.0409.html", "url": "http://love-hina.ch/news/0409.html", "text_len": 404, "tp": 1, "fn": 0, "fp": 1, "tn": 1, "details": [{"type": "with", "string": "Kapitel 121 ist", "found": true}, {"type": "without", "string": "Kommentare schreiben", "found": false}, {"type": "without", "string": "19:49", "found": true}]}
{"file": "basicthinking.de.tweets.html", "url": "https://www.basicthinking.de/blog/2018/12/05/erfolgreiche-tweets-zutaten/", "text_len": 14197, "tp": 4, "fn": 0, "fp": 2, "tn": 3, "details": [{"type": "with", "string": "Frank Thelen, Investor", "found": true}, {"type": "with", "string": "Meine Mutter ist jederzeit", "found": true}, {"type": "with", "string": "Female founders must constantly consider", "found": true}, {"type": "with", "string": "Thema des \u00f6ffentlichen Interesses", "found": true}, {"type": "without", "string": "Nach langj\u00e4hriger T\u00e4tigkeit im Ausland", "found": false}, {"type": "without", "string": "Mit Absendung des Formulars willige ich", "found": false}, {"type": "without", "string": "Auch interessant", "found": true}, {"type": "without", "string": "Kommentieren", "found": false}, {"type": "without", "string": "Wir tun jeden Tag, was wir lieben.", "found": true}]}
{"file": "selbermachen.de-wohngewaechshaus.html", "url": "https://selbermachen.de/garten/gartenhaus-selber-bauen/wohngewaechshaus-selber-bauen", "text_len": 4050, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "feuchteres Klima, als in unseren", "found": true}, {"type": "with", "string": "Konstruiert nach dem Prinzip der thermischen", "found": true}, {"type": "with", "string": "Die Traufenprofile werden mit Hilfe", "found": true}, {"type": "without", "string": "Mehr lesen \u00fcber:", "found": false}, {"type": "without", "string": "Fahrradunterstand selber", "found": false}, {"type": "without", "string": "Hochbeet selber bauen -", "found": false}]}
{"file": "mtb-news.de-tubeless.html", "url": "https://www.mtb-news.de/news/reifen-tubeless-montieren/", "text_len": 5487, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "gemacht! Schlauchlose Reifen", "found": true}, {"type": "with", "string": "Dieser muss luftdicht abschliessen", "found": true}, {"type": "with", "string": "Systeme bieten eine h\u00f6here", "found": true}, {"type": "without", "string": "Mehr zum Thema", "found": false}, {"type": "without", "string": "120 Kommentare", "found": false}, {"type": "without", "string": "Best of Test: Die besten Bikes 2022", "found": false}]}
{"file": "mluk.brandenburg.de-erlegungspermie.html", "url": "https://mluk.brandenburg.de/mluk/de/aktuelles/presseinformationen/detail/~02-01-2022-land-zahlte-rund-1-4-millionen-euro-erlegungspraemie-fuer-wildschweine-im-jagdjahr-202020#", "text_len": 2953, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "R\u00fcckblickend wurde die allgemeine Erlegungspr\u00e4mie", "found": true}, {"type": "with", "string": "Schwarzwild lag sowohl die Zahl", "found": true}, {"type": "with", "string": "Auszahlung der Bachenpr\u00e4mie m\u00fcssen bis zum 30. April", "found": true}, {"type": "without", "string": "Informationen zur ASP und zur Bachenpr\u00e4mie", "found": false}, {"type": "without", "string": "Weiterf\u00fchrende Informationen", "found": false}, {"type": "without", "string": "Weiterf\u00fchrende Informationen", "found": false}]}
{"file": "dietagespresse.com-halloween.html", "url": "https://dietagespresse.com/halloween-bizarrer-horrorclown-versetzt-oesterreich-in-angst-und-schrecken/", "text_len": 580, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "kichert der irre Horrorclown im 10-sek\u00fcndigen Gruselclip", "found": true}, {"type": "with", "string": "Das bizarre Drohvideo", "found": true}, {"type": "with", "string": "das auf sozialen Medien seine Runden dreht", "found": true}, {"type": "without", "string": "Kostenlos registrieren und weiterlesen", "found": false}, {"type": "without", "string": "Schon registriert? Hier einloggen", "found": false}, {"type": "without", "string": "Was passiert mit meinen Daten?", "found": false}]}
{"file": "exxpress.at-zaehne.html", "url": "https://exxpress.at/zaehne-zusammenbeissen-festspiel-reisen-von-van-der-bellen-kosteten-57-000-euro/", "text_len": 2302, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Kosten f\u00fcr Festspielbesuche des Bundespr\u00e4sidenten", "found": true}, {"type": "with", "string": "finden vor allem die Freiheitlichen zum Z\u00e4hneknirschen", "found": true}, {"type": "with", "string": "Grund: Die Ausfl\u00fcge von Van der Bellen zu den vier Kulturevents haben unfassbare 57.000 Euro gekostet", "found": true}, {"type": "without", "string": "Das k\u00f6nnte Sie auch interessieren", "found": false}, {"type": "without", "string": "Ihr Beitrag hilft, unsere Berichterstattung noch", "found": false}, {"type": "without", "string": "weiter auszubauen und diese weiterhin kostenlos", "found": false}]}
{"file": "tarnkappe.info-Black.html", "url": "https://tarnkappe.info/artikel/empfehlungen/happy-halloween-hide-me-senkt-kurzfristig-die-preise-282156.html", "text_len": 3966, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Das zweij\u00e4hrige Abo kostet ab den 1. November pro Monat nur 2,22 Euro", "found": true}, {"type": "with", "string": "Insgesamt werden f\u00fcr 27 Monate folglich knapp 60 Euro f\u00e4llig", "found": true}, {"type": "with", "string": "Zumindest was die Verschleierung der eigenen IP-Adresse betrifft", "found": true}, {"type": "without", "string": "Kein Bock auf Werbung?", "found": false}, {"type": "without", "string": "Wir auch nicht. Dennoch kannst Du Dir", "found": false}, {"type": "without", "string": "sicher vorstellen, dass hinter dieser Webseite viel Zeit und Arbeit steckt.", "found": false}]}
{"file": "viehbacher.com.steuerrecht.html", "url": "https://viehbacher.com/de/steuerrecht", "text_len": 5074, "tp": 3, "fn": 0, "fp": 0, "tn": 1, "details": [{"type": "with", "string": "und wirtschaftlich orientierte Privatpersonen", "found": true}, {"type": "with", "string": "rund um die Uhr.", "found": true}, {"type": "with", "string": "Mensch im Mittelpunkt.", "found": true}, {"type": "without", "string": "Was sind Cookies?", "found": false}]}
{"file": "reddit.com.init.html", "url": "https://www.reddit.com/r/Python/comments/1bbbwk/whats_your_opinion_on_what_to_include_in_init_py/", "text_len": 8325, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Considering a package", "found": true}, {"type": "with", "string": "Import key functions", "found": true}, {"type": "with", "string": "EDIT: Thanks a lot", "found": true}, {"type": "without", "string": "news about the dynamic", "found": false}, {"type": "without", "string": "All rights reserved", "found": false}, {"type": "without", "string": "I see your minesweeper", "found": false}]}
{"file": "cbsnews.com.carolina.html", "url": "https://www.cbsnews.com/news/2020-presidential-election-south-carolina-black-voters-democrats-joe-biden/", "text_len": 4726, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "The stakes are high for all of the candidates ahead of Tuesday", "found": true}, {"type": "with", "string": "At a family fun run in the state", "found": true}, {"type": "with", "string": "Asked why she called the group the Reckoning Crew,", "found": true}, {"type": "without", "string": "\u00a9 2020 CBS Interactive Inc. All Rights Reserved.", "found": false}, {"type": "without", "string": "Email", "found": false}, {"type": "without", "string": "Black voters in S.C. on the 2020 Democrats", "found": false}]}
{"file": "abc7news.com-Napa.html", "url": "https://abc7news.com/camp-margaritaville-resort-napa-county-lake-berryessa-hotel-jimmy-buffett/14031465/", "text_len": 2785, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "so I think anyone that wants to do business in this area", "found": true}, {"type": "with", "string": "as an incredible opportunity to make sure", "found": true}, {"type": "with", "string": "it is done fair responsibly", "found": true}, {"type": "without", "string": "Top Stories", "found": false}, {"type": "without", "string": "LIVE STREAMS", "found": false}, {"type": "without", "string": "Building A Better Bay Area", "found": false}]}
{"file": "lexikon.huettenhilfe.de.banane.html", "url": "http://lexikon.huettenhilfe.de/obst/banane.html", "text_len": 10860, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Bananen verderben - wie es bestimmt jeder schon erlebt hat", "found": true}, {"type": "with", "string": "Die \"Gro\u00dfe Obstbanane\" und ihre Sorten", "found": true}, {"type": "with", "string": "Wie die Banane nach Europa kam", "found": true}, {"type": "without", "string": "2006 - 2012 huettenhilfe.de", "found": false}, {"type": "without", "string": "N\u00fcsse und Kerne", "found": false}, {"type": "without", "string": "und vieles mehr rund um die K\u00fcche", "found": false}]}
{"file": "tonedeaf.thebrag.com.luboku.html", "url": "https://tonedeaf.thebrag.com/record-of-the-week-luboku-pale-blue-dot-lift-off/", "text_len": 2106, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "It\u2019s no coincidence that the 30 year anniversary of the da", "found": true}, {"type": "with", "string": "Still need convincing on why it\u2019s our top record this week?", "found": true}, {"type": "with", "string": "From its hypnotic synths to its brooding melodies, Luboku takes", "found": true}, {"type": "without", "string": "Grimes releases her new album Miss Anthropocene", "found": false}, {"type": "without", "string": "Grimes has released her fifth album", "found": false}, {"type": "without", "string": "Discover our latest editorial picks", "found": false}]}
{"file": "nationalgeographic.co.uk.goats.html", "url": "https://www.nationalgeographic.co.uk/environment-and-conservation/2020/01/ravenous-wild-goats-ruled-island-over-century-now-its-being", "text_len": 6817, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "an imposing piece", "found": true}, {"type": "with", "string": "Once the goats and rats", "found": true}, {"type": "with", "string": "But they don\u2019t know the work", "found": true}, {"type": "without", "string": "Photograph by", "found": false}, {"type": "without", "string": "Find More Information", "found": false}, {"type": "without", "string": "What it\u2019s like to live", "found": false}]}
{"file": "nh24.de-Bundeswehr.html", "url": "https://nh24.de/2023/11/06/mitarbeiter-fordern-bundeswehr-auftraege-fuer-deutsche-unternehmen/#more-244202", "text_len": 1845, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Bef\u00fcrchtung der Besch\u00e4ftigten resultiert", "found": true}, {"type": "with", "string": "aus der vermehrten Beschaffung von Flugzeugen", "found": true}, {"type": "with", "string": "und Hubschraubern f\u00fcr die Bundeswehr aus US-Produktion", "found": true}, {"type": "without", "string": "PLAG-ADVENTS-ANGEBOT", "found": false}, {"type": "without", "string": "BESTATTUNGSHAUS WILLE IN KN\u00dcLLWALD", "found": false}, {"type": "without", "string": "SCHUHHAUS HERCHE R\u00c4UMUNGSVERKAUF", "found": false}]}
{"file": "knowtechie.com.rally.html", "url": "https://knowtechie.com/rocket-pass-4-in-rocket-league-brings-with-it-a-new-rally-inspired-car/", "text_len": 2073, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Rocket Pass 4 will begin at 10:00 a.m. PDT", "found": true}, {"type": "with", "string": "Let us know down below in the comments", "found": true}, {"type": "with", "string": "Holy shit, Mortal Kombat 11", "found": true}, {"type": "without", "string": "Related Topics", "found": false}, {"type": "without", "string": "You can keep up with me on Twitter", "found": false}, {"type": "without", "string": "Hit the track today with Mario Kart Tour", "found": false}]}
{"file": "limespace.de.entloeten.html", "url": "https://www.limespace.de/2019/10/22/professionell-entloeten-so-machen-sie-alte-elektrogeraete-wieder-einsatzbereit/", "text_len": 3812, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Haushaltsger\u00e4te, die verr\u00fccktspielen", "found": true}, {"type": "with", "string": "das Verzinnen der Pins", "found": true}, {"type": "with", "string": "Entl\u00f6tstation und einigen Handgriffen", "found": true}, {"type": "without", "string": "Diese Website verwendet Akismet", "found": false}, {"type": "without", "string": "Das k\u00f6nnte Dich auch interessieren \u2026", "found": false}, {"type": "without", "string": "Werbepause", "found": false}]}
{"file": "amazedmag.de.meinleben.html", "url": "https://www.amazedmag.de/white-passing-oder-mein-leben-irgendwo-dazwischen/", "text_len": 9516, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ich wollte diesen Text schon", "found": true}, {"type": "with", "string": "Heute sehe ich das anders.", "found": true}, {"type": "with", "string": "\u201eDa wo du herkommst, bin ich zu wei\u00df", "found": true}, {"type": "without", "string": "Sharing is caring", "found": false}, {"type": "without", "string": "\u00c4hnliche Artikel", "found": false}, {"type": "without", "string": "ABOUT", "found": false}]}
{"file": "taz.de.siemens.html", "url": "https://taz.de/Siemens-und-die-Kohlemine-Adani/!5655255/", "text_len": 4392, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ein paar Konsument*innen m\u00f6gen", "found": true}, {"type": "with", "string": "Einige von ihnen, etwa Axa", "found": true}, {"type": "with", "string": "ei potenziellen Kund*innen aus der fossilen Industrie", "found": true}, {"type": "without", "string": "Hinter jedem Klick auf taz.de", "found": false}, {"type": "without", "string": "Schreibt seit 2008 f\u00fcr die taz", "found": false}, {"type": "without", "string": "Bitte registrieren Sie sich und halten Sie sich", "found": false}]}
{"file": "chadim.net.schreibstil.html", "url": "https://chadim.net/text-planung/der-schreibstil", "text_len": 899, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Beim Schreiben Ihrer Texte", "found": true}, {"type": "with", "string": "Fremd- und Modew\u00f6rtern", "found": true}, {"type": "with", "string": "an Ihren Lesern vorbeischreiben", "found": true}, {"type": "without", "string": "Angemeldet bleiben", "found": false}, {"type": "without", "string": "... weiter zu \"die Wortwahl\"", "found": true}, {"type": "without", "string": "Aktuelle Seite:", "found": false}]}
{"file": "rueda.wikidot.com.enchufla.html", "url": "http://rueda.wikidot.com/enchufla", "text_len": 6416, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Platzwechsel, langsam erkl\u00e4rt", "found": true}, {"type": "with", "string": "Start, wenn man rechts auf rechts ist", "found": true}, {"type": "with", "string": "zieht die Folgende den F\u00fchrenden an der H\u00fcfte zur\u00fcck", "found": true}, {"type": "without", "string": "Unless otherwise stated, the content of this page", "found": false}, {"type": "without", "string": "Other interesting sites", "found": false}, {"type": "without", "string": "Ansagen nach Grundschritt", "found": false}]}
{"file": "archive.org.swap-stop.org.shuji.html", "url": "https://web.archive.org/web/20181206101316/https://swap-stop.org/de/filmswap/zusammenarbeit-shuji-walter-april-2018-i/", "text_len": 348, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Fuji X-TRA 400.", "found": true}, {"type": "with", "string": "Walter: PENTAX Z-1", "found": true}, {"type": "with", "string": "Belichtungsfolge", "found": true}, {"type": "without", "string": "Wird geladen", "found": false}, {"type": "without", "string": "Teilen mit:", "found": false}, {"type": "without", "string": "(c) 2016", "found": false}]}
{"file": "erzbstbstum-koeln.de-halskrankheiten.html", "url": "https://www.erzbistum-koeln.de/presse_und_medien/magazin/Blasius-Segen-Schutz-vor-Halskrankheiten/", "text_len": 3595, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "der bekanntesten Legende soll", "found": true}, {"type": "with", "string": "ab dem Vorabend des Gedenktages des hl. Blasius", "found": true}, {"type": "with", "string": "Gott Mensch geworden ist, will uns", "found": true}, {"type": "without", "string": "Radiobeitrag zum Blasius-Segen", "found": false}, {"type": "without", "string": "Der Valentinstag am 14. Februar ist der", "found": false}, {"type": "without", "string": "Live-\u00dcbertragungen der Hl.", "found": false}]}
{"file": "pinkstinks.de-Kulturtechnik.html", "url": "https://pinkstinks.de/das-patriarchat-als-kulturtechnik/", "text_len": 6717, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Zum einen sind wir hier nicht in einem Proseminar Soziologie.", "found": true}, {"type": "with", "string": "Zum anderen haben Soziologinnen wie Eva Cyba mit Geschlecht und soziale Ungleichheit", "found": true}, {"type": "with", "string": "Existenz und Wirkweise des Patriarchats sehr viel deutlicher herausgearbeitet als Max Weber", "found": true}, {"type": "without", "string": "FOLGT UNS!", "found": false}, {"type": "without", "string": "AKTUELLE BEITR\u00c4GE", "found": false}, {"type": "without", "string": "\u00c4HNLICHE BEITR\u00c4GE", "found": false}]}
{"file": "archive.org.medialepfade.de.medienpaedagogin.html", "url": "https://web.archive.org/web/20160820205919/http://www.medialepfade.de/2016/01/medienpaedagogin-in-muenchen-gesucht/", "text_len": 2381, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Web-Video, Online-Journalismus, sowie ePartizipation, Games und Open Education. Unser inhaltlicher Schwerpun", "found": true}, {"type": "with", "string": "Professionalit\u00e4t und Souver\u00e4nit\u00e4t im Umgang mit Partnern und F\u00f6rderern", "found": true}, {"type": "with", "string": "ngabe des m\u00f6glichen Eintrittstermins bis zum 01. Februar 2016 an", "found": true}, {"type": "without", "string": "lauff\u00e4higes Wifi, angetrieben durch ein Fahrrad, um zum Umweltschutz zu animieren @jhacktost https://t.co/8elCKJjm3o", "found": false}, {"type": "without", "string": "Blog-Themen:", "found": false}, {"type": "without", "string": "M\u00f6chten Sie unseren Newsletter erhalten?", "found": false}]}
{"file": "siegessaeule.de-Machtinstrument.html", "url": "https://www.siegessaeule.de/magazin/p%C3%A4dophilie-als-politisches-machtinstrument/", "text_len": 8363, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Dabei gab es dort keine Bef\u00fcrwortung", "found": true}, {"type": "with", "string": "wie etwa die QAnon-Erz\u00e4hlung", "found": true}, {"type": "with", "string": "Wir haben auch heute noch keinen Weg", "found": true}, {"type": "without", "string": "Peter Rehberg: \u201eSchwule glauben, sich", "found": false}, {"type": "without", "string": "KULTUR", "found": false}, {"type": "without", "string": "Bild: Stefan M\u00fcller", "found": false}]}
{"file": "maenner.media-church.html", "url": "https://www.maenner.media/gesellschaft/community/interview-mit-rainer-teuber-outinchurch/", "text_len": 2929, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "den Besucherservice. Er ist schwul", "found": true}, {"type": "with", "string": "Was m\u00fcsste sich in den Bist\u00fcmern", "found": true}, {"type": "with", "string": "\u00dcber das Rogate-Kloster: Eine", "found": true}, {"type": "without", "string": "HuK (Homosexuelle und Kirche)", "found": false}, {"type": "without", "string": "Der Einsatz f\u00fcr die Menschenrechte ist", "found": false}, {"type": "without", "string": "Kostenloser Download:", "found": false}]}
{"file": "agrarheute.com.abfallholz.html", "url": "https://www.agrarheute.com/energie/heizen-abfallholz-erfindung-funktioniert-601129", "text_len": 2284, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Auch d\u00fcnne \u00c4ste", "found": false}, {"type": "with", "string": "Zun\u00e4chst steckt er die", "found": true}, {"type": "with", "string": "Die Hydraulikpresse im Inneren", "found": true}, {"type": "without", "string": "Mehr zum Thema", "found": false}, {"type": "without", "string": "Hier ist Ihre Meinung gefragt", "found": false}, {"type": "without", "string": "Wir informieren Sie t\u00e4glich", "found": false}]}
{"file": "baumeister.de.sportzentrum.html", "url": "https://www.baumeister.de/sportzentrum-kerenzerberg-filzbach/", "text_len": 703, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Am S\u00fcdufer des Walensees", "found": true}, {"type": "with", "string": "Das Sportzentrum erhielt auch", "found": false}, {"type": "with", "string": "Im Bestand liegt der Schwerpunkt", "found": false}, {"type": "without", "string": "Nicht aus den Siebzigern", "found": false}, {"type": "without", "string": "NAPURS MUSEUM OF ETHNOGRAPHY BUDAPEST, FOTO: PALK\u00d3 GY\u00d6RGY - ", "found": false}, {"type": "without", "string": "Napur Marcel Ferencz Kultur", "found": false}]}
{"file": "elavegan.com-Peanut.html", "url": "https://elavegan.com/peanut-butter-truffles/", "text_len": 0, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "If you\u2019re obsessed with peanut butter", "found": false}, {"type": "with", "string": "and looking for a treat that will stop you", "found": false}, {"type": "with", "string": "from sticking your spoon directly into the jar (guilty!)", "found": false}, {"type": "without", "string": "AMAZON ASSOCIATES DISCLOSURE", "found": false}, {"type": "without", "string": "5 Secrets to Healthy Vegan Cooking", "found": false}, {"type": "without", "string": "EXPLORE MORE", "found": false}]}
{"file": "zdf.de.corona.html", "url": "https://www.zdf.de/sport/us-sport-corona-100.html", "text_len": 1923, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "New York ist das Epizentrum der Corona-Pandemie", "found": true}, {"type": "with", "string": " Auch der Sport ist zum Stillstand", "found": true}, {"type": "with", "string": "Die Anteilnahme in den Top-Ligen ist gro\u00df. Wie es ", "found": true}, {"type": "without", "string": "Video verf\u00fcgbar bis 28.02.2021", "found": true}, {"type": "without", "string": "Auch interessant", "found": false}, {"type": "without", "string": "ZDF Unternehmen", "found": false}]}
{"file": "gnaur.wordpress.com.moglichkeit.html", "url": "https://gnaur.wordpress.com/2013/06/14/die-moglichkeit-nichts-zu-tun-ist-auch-eine-moglichkeit/", "text_len": 251, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u201eIch wei\u00df ich bin", "found": true}, {"type": "with", "string": "\u2013 \u201eOk.\u201c", "found": true}, {"type": "with", "string": "sollte das vielleich", "found": true}, {"type": "without", "string": "Kommentar verfassen", "found": false}, {"type": "without", "string": "Die Inhalte dieser Website sind", "found": false}, {"type": "without", "string": "Kategorien", "found": false}]}
{"file": "pointofsail-kiel.de.wilson.html", "url": "http://www.pointofsail-kiel.de/artikel/ben-wilson-surf.html", "text_len": 951, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "So manch einer der eingefleischten", "found": true}, {"type": "with", "string": "We are 100% committed to", "found": true}, {"type": "with", "string": "Our search for perfection never ends", "found": true}, {"type": "without", "string": "Bei uns wirst du frei nach dem Motto", "found": false}, {"type": "without", "string": "Folge uns auch in den sozialen", "found": false}, {"type": "without", "string": "Kontakt", "found": false}]}
{"file": "denkanstoos.com.2012.html", "url": "https://denkanstoos.wordpress.com/2012/04/11/denkanstoos-april-2012/", "text_len": 509, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Moderator: Hass Chapman", "found": true}, {"type": "with", "string": "Two or three 10-15 min", "found": true}, {"type": "with", "string": "What type? Etc. (30 mins)", "found": true}, {"type": "without", "string": "Dieser Eintrag wurde ver\u00f6ffentlicht", "found": false}, {"type": "without", "string": "Mit anderen Teillen", "found": false}, {"type": "without", "string": "In \"DenkanStoos-Treffen\"", "found": false}]}
{"file": "otto.de.twoforfashion.html", "url": "https://www.otto.de/twoforfashion/strohtasche/", "text_len": 3861, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Ob rund oder kastenf\u00f6rmig, ob dezent oder auff\u00e4llig", "found": true}, {"type": "with", "string": "XX, Die Redaktion", "found": true}, {"type": "without", "string": "Kommentieren", "found": false}, {"type": "without", "string": "Dienstag, 4. Juni 2019", "found": false}]}
{"file": "oekonomenstimme.org.keynes.html", "url": "https://www.oekonomenstimme.org/artikel/2015/01/eine-realistische-interpretation-des-keynes-hicks-multiplikators/", "text_len": 10322, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In seinem Beitrag von 5. Januar 2015 er\u00f6rtert Wolfgang", "found": true}, {"type": "with", "string": "Wirtschaftsdienst, 92. Jahrgang, Heft 10, Oktober 2012", "found": true}, {"type": "with", "string": "Erfasst werden. Dabei steht T f\u00fcr den technologischen Fortschritt", "found": true}, {"type": "without", "string": "Die paradigmatische Struktur der Makro\u00f6konomik", "found": false}, {"type": "without", "string": "um Kommentare zu schreiben", "found": false}, {"type": "without", "string": "Faktor Arbeit im Sinkflug", "found": false}]}
{"file": "baechli-bergsport.ch-lawinen.html", "url": "https://www.baechli-bergsport.ch/Blog/Einblick-in-die-Praxis-und-Theorie-von-Lawinen-De-9-9-9-9-1.htm", "text_len": 21490, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "wir bestens vorbereitet sind,", "found": true}, {"type": "with", "string": "Knie in die H\u00fcfte bis in den", "found": true}, {"type": "with", "string": "langsam sein und im Nachhinein", "found": true}, {"type": "without", "string": "Abbildung 4: klassische Schwachschicht.", "found": true}, {"type": "without", "string": "TEILE DIESEN BEITRAG AUF", "found": false}, {"type": "without", "string": "Vorgehensweise f\u00fcr grosse Ereignisse", "found": true}]}
{"file": "caktusgroup.com.django.html", "url": "https://www.caktusgroup.com/blog/2015/06/08/testing-client-side-applications-django-post-mortem/", "text_len": 5762, "tp": 5, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "Was I losing my mind?", "found": true}, {"type": "with", "string": "being cached after their first access.", "found": true}, {"type": "with", "string": "Finding a Fix", "found": true}, {"type": "with", "string": "from django.conf import settings", "found": true}, {"type": "with", "string": "Clear the cache versions", "found": true}, {"type": "without", "string": "Mark Lavin", "found": false}, {"type": "without", "string": "New Call-to-action", "found": false}, {"type": "without", "string": "You might also like:", "found": false}, {"type": "without", "string": "Get tips, see case studies", "found": false}]}
{"file": "tagesanzeiger.ch.umweltzerstoerung.html", "url": "https://www.tagesanzeiger.ch/wie-umweltzerstoerung-neue-epidemien-beguenstigt-633956751547", "text_len": 8160, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Dichter Rauch hing im Herbst des Jahres 1997", "found": true}, {"type": "with", "string": "es kann auch von Mensch zu Mensch weitergegeben werden.", "found": true}, {"type": "with", "string": "Im Wesentlichen geht es da aber um Fragen der Wirtschaft und", "found": true}, {"type": "without", "string": "Aktualisiert:", "found": false}, {"type": "without", "string": "03.04.2020", "found": false}, {"type": "without", "string": "All Rights Reserved", "found": false}]}
{"file": "domradio.de-Reformstau.html", "url": "https://www.domradio.de/themen/laien/2021-11-19/reformstau-loesen-irme-stetter-karp-ist-neue-zdk-praesidentin", "text_len": 7748, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "votierten 41 Delegierte.", "found": true}, {"type": "with", "string": "F\u00fcr Reformen k\u00e4mpfen", "found": true}, {"type": "with", "string": "Stil des ZdK-Pr\u00e4sidiums.", "found": true}, {"type": "without", "string": "Logo des Zdk", "found": false}, {"type": "without", "string": "Nach oben", "found": false}, {"type": "without", "string": "Zentralkomitee der", "found": true}]}
{"file": "lady50plus.de.sekre.html", "url": "https://lady50plus.de/2019/06/19/sekre-mystery-bag/", "text_len": 6134, "tp": 3, "fn": 2, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "ist eine echte Luxushandtasche", "found": true}, {"type": "with", "string": "Insgesamt 160 weibliche \u201eDesignerinnen\u201c", "found": true}, {"type": "with", "string": "Sei herzlich gegr\u00fc\u00dft", "found": false}, {"type": "with", "string": "Ein Mann alleine h\u00e4tte niemals", "found": false}, {"type": "with", "string": "in den Bann ziehen!", "found": true}, {"type": "without", "string": "Erforderliche Felder sind mit", "found": false}, {"type": "without", "string": "Benachrichtige mich", "found": false}, {"type": "without", "string": "Reisen ist meine gro\u00dfe Leidenschaft", "found": false}, {"type": "without", "string": "Styling Tipps f\u00fcr Oktober", "found": false}]}
{"file": "greator.com.innerezufriedenheit.html", "url": "https://greator.com/innere-zufriedenheit/", "text_len": 7022, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Innere Zufriedenheit ist ein wichtiger Faktor ", "found": true}, {"type": "with", "string": "10 Tipps f\u00fcr innere Zufriedenheit:", "found": true}, {"type": "with", "string": "Fazit", "found": true}, {"type": "without", "string": "Themen", "found": false}, {"type": "without", "string": "Greator Newsletter", "found": false}, {"type": "without", "string": "Artikel gefallen? Vergiss nicht zu teilen!", "found": false}]}
{"file": "thebalance.com.coinbase.html", "url": "https://www.thebalance.com/coinbase-vs-coinbase-pro-5116733", "text_len": 14833, "tp": 2, "fn": 1, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Coinbase and Coinbase Pro are two of the most popular cryptocurrency exchanges", "found": true}, {"type": "with", "string": " At a Glance ", "found": false}, {"type": "with", "string": "1 GBP withdrawal", "found": true}, {"type": "without", "string": "Jacob Wade is a personal finance expert", "found": false}, {"type": "without", "string": "Kraken vs. Coinbase", "found": false}, {"type": "without", "string": "We recommend the best products", "found": true}]}
{"file": "shabka.org.about.html", "url": "https://shabka.org/about-us/", "text_len": 4030, "tp": 3, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "The Future Strategists Hub 2018 was Shabka\u2019s", "found": true}, {"type": "with", "string": "on several levels as well as supra-instutional", "found": true}, {"type": "with", "string": "One of the book project\u2019s key", "found": true}, {"type": "without", "string": "\u00a9 Shabka 2019", "found": false}, {"type": "without", "string": "Contact", "found": false}]}
{"file": "qualisys.eu.gefahrstoff.html", "url": "http://www.qualisys.eu/gefahrstoff-service", "text_len": 5110, "tp": 3, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Qualisys ist spezialisiert auf die Optimierung des Gefahrstoffmanagements", "found": true}, {"type": "with", "string": "SUMDAT Desktop im Format eines Sicherheitsdatenblattes", "found": true}, {"type": "with", "string": "Das Qualisys Gefahrstoff-Backoffice erf\u00fcllt alle Anforderungen", "found": true}, {"type": "without", "string": "D-40764 Langenfeld", "found": false}, {"type": "without", "string": "Kontakt", "found": false}]}
{"file": "mindmegette.hu.levagott.html", "url": "https://www.mindmegette.hu/levagott-ujj-vajas-kekszek-halloweenra-59841/", "text_len": 3563, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Szeretem, hogy a k\u00f6zelg\u0151 t\u00e9li h\u00f3napokat", "found": true}, {"type": "with", "string": "Ezen az \u00e9jszak\u00e1n nagy bulikat szerveznek, ahol", "found": true}, {"type": "with", "string": "azonnal, vagy t\u00e1roljuk \u0151ket j\u00f3l z\u00e1r\u00f3d\u00f3 dobozban", "found": true}, {"type": "without", "string": "Ezek is \u00e9rdekelhetnek", "found": false}, {"type": "without", "string": "Receptek karfiollal", "found": false}, {"type": "without", "string": "Friss receptjeink", "found": false}]}
{"file": "theverge.com.ios13.html", "url": "https://www.theverge.com/2019/7/3/20680681/ios-13-beta-3-facetime-attention-correction-eye-contact", "text_len": 1990, "tp": 3, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Normally, video calls tend to", "found": true}, {"type": "with", "string": "across both the eyes and nose.", "found": true}, {"type": "with", "string": "Added ARKit explanation and tweet.", "found": true}, {"type": "without", "string": "Singapore\u2019s public health program", "found": false}, {"type": "without", "string": "Command Line delivers daily updates", "found": false}]}
{"file": "ethify.org.vegetarier.html", "url": "https://ethify.org/content/vegetarier-zu-sein-bedarf-trend-oder-eigene-entscheidung", "text_len": 3433, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Vegetarier zu sein. Bedarf, Trend", "found": true}, {"type": "with", "string": "In \u00d6sterreich sind momentan", "found": true}, {"type": "with", "string": "vor 5 Jahren fast keine", "found": true}, {"type": "without", "string": "Wachstum im Wandel", "found": false}, {"type": "without", "string": "Mit unserem Newsletter", "found": false}, {"type": "without", "string": "communities 2010 - 2020", "found": false}]}
{"file": "schneems.com.rubocop.html", "url": "https://www.schneems.com/2018/10/09/pair-with-me-rubocop-cop-that-detects-duplicate-array-allocations/", "text_len": 6374, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "You might know rubocop", "found": true}, {"type": "with", "string": "You can use this code:", "found": true}, {"type": "with", "string": "While it might not", "found": true}, {"type": "without", "string": "Join the hundreds of developers", "found": false}, {"type": "without", "string": "I maintain an internal-facing", "found": false}, {"type": "without", "string": "Today I have an unusual proposition", "found": false}]}
{"file": "de.happycoffee.org.sidamo.html", "url": "https://de.happycoffee.org/collections/shop/products/happy-coffee-sidamo-bio-kaffeebohnen", "text_len": 1244, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Rote Beeren, Zitrusnoten, s\u00fc\u00dflich", "found": true}, {"type": "with", "string": "Handgepfl\u00fcckt, gewaschen, sonnengetrocknet", "found": true}, {"type": "with", "string": "Alle Kaffees von Happy Coffee sind bio-zertifiziert", "found": true}, {"type": "without", "string": "Jetzt mit 10% Dauerrabatt", "found": false}, {"type": "without", "string": "Unsere Kaffees", "found": false}, {"type": "without", "string": "Frisch ger\u00f6steter Kaffee nach Hause geliefert", "found": false}]}
{"file": "verfassungsblog.de.expertinnen.html", "url": "https://verfassungsblog.de/expertinnen-in-der-krise/", "text_len": 12128, "tp": 3, "fn": 0, "fp": 1, "tn": 5, "details": [{"type": "with", "string": "Die verfassungsrechtswissenschaftliche Begleitung", "found": true}, {"type": "with", "string": "Selbstgewissheit abr\u00fcsten", "found": true}, {"type": "with", "string": "eine besondere Vorbildfunktion.", "found": true}, {"type": "without", "string": "is a Professor of Public", "found": false}, {"type": "without", "string": "I know that I may withdraw my consent", "found": false}, {"type": "without", "string": "If you enjoyed reading this post", "found": true}, {"type": "without", "string": "VerfBlog", "found": false}, {"type": "without", "string": "Comments under pseudonym are allowed", "found": false}, {"type": "without", "string": "European constitutional space and beyond.", "found": false}]}
{"file": "kleinegruenemonster.wordpress.com.start.html", "url": "https://kleinegruenemonster.wordpress.com/2016/01/01/ein-entspannter-start-ins-neue-jahr-2016-be-happy/", "text_len": 1764, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "geht es um Themen wie Entspannung, Meditation und Wellness, aber auch Essen, Leben und Fitness.", "found": true}, {"type": "with", "string": "Man zieht Bilanz. Was hat das vergangene Jahr gebracht?", "found": true}, {"type": "with", "string": "Wer, verdammt noch mal, hat die 40 Stunden Arbeitswoche erfunden?", "found": true}, {"type": "without", "string": "r unter Namensnennung bzw. Linksetzung. Danke.", "found": false}, {"type": "without", "string": "Benachrichtigungen \u00fcber neue Beitr\u00e4ge zu", "found": false}, {"type": "without", "string": " Verwendung, Vervielf\u00e4ltigung und Weitergabe der Inhalte", "found": false}]}
{"file": "kath.net-Menschensohn.html", "url": "https://kath.net/news/76785", "text_len": 6325, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "da sammeln sich auch", "found": true}, {"type": "with", "string": "haupts\u00e4chlich der orthodoxen", "found": true}, {"type": "with", "string": "Die scheinbare Verherrlichung", "found": true}, {"type": "without", "string": "(Weihe-)Alter", "found": false}, {"type": "without", "string": "Bistum Hildesheim: Das", "found": false}, {"type": "without", "string": "meist-diskutiert", "found": true}]}
{"file": "fem.com.gehaelter.html", "url": "https://www.fem.com/beauty-lifestyle/warum-wir-anfangen-muessen-mehr-ueber-gehaelter-zu-sprechen", "text_len": 3660, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Es ist schon sehr deutsch,", "found": true}, {"type": "with", "string": "Offenheit gegen ungleiche Geh\u00e4lter", "found": true}, {"type": "with", "string": "Weil Chefs das nat\u00fcrlich gar", "found": true}, {"type": "without", "string": "MEHR ZUM THEMA JOB UND KARRIERE", "found": false}, {"type": "without", "string": "INSTAGRAM", "found": false}, {"type": "without", "string": "AM H\u00c4UFIGSTEN GELESEN", "found": false}]}
{"file": "datev-magazin.de-kommunikation.html", "url": "https://www.datev-magazin.de/archiv/sichere-und-digitale-mandantenkommunikation-73813", "text_len": 1418, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Vorteilen eines sicheren und durchg\u00e4ngig", "found": true}, {"type": "with", "string": "Registrierung ist die WebAkte innerhalb", "found": true}, {"type": "with", "string": "weitere Informationen erhalten", "found": true}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}, {"type": "without", "string": "Meistgelesene Artikel", "found": false}, {"type": "without", "string": "Aktuelle Meldungen", "found": false}]}
{"file": "it-learner.de.autotuning.html", "url": "https://it-learner.de/wenn-das-netzwerk-unter-windows-10-sehr-langsam-ist-koennte-das-abschalten-der-autotuning-funktion-abhilfe-schaffen/", "text_len": 1328, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Mit Windows Vista wurde damals die sogenannte Autotuning Funktion", "found": true}, {"type": "with", "string": "netsh interface tcp set global autotuninglevel=normal", "found": true}, {"type": "with", "string": "Jedoch gibt es anscheinend Probleme mit \u00e4lteren Routern", "found": true}, {"type": "without", "string": "Hole dir jetzt das kostenlose Ebook.", "found": false}, {"type": "without", "string": "2 Kommentare", "found": false}, {"type": "without", "string": "Zappen ... R\u00e4tsel : entdeckt", "found": false}]}
{"file": "outdoor-magazin.com-vanlife.html", "url": "https://www.outdoor-magazin.com/outdoor-szene/vanlife-in-schweden/", "text_len": 8384, "tp": 3, "fn": 0, "fp": 3, "tn": 0, "details": [{"type": "with", "string": "Der Traum vieler Vanlife- und", "found": true}, {"type": "with", "string": "Teilnehmern gilt die 2G-Regel", "found": true}, {"type": "with", "string": "Schweden unz\u00e4hlige legale", "found": true}, {"type": "without", "string": "Das Wasser aus B\u00e4chen und Fl\u00fcssen", "found": true}, {"type": "without", "string": "Die Alstadt Stockholms", "found": true}, {"type": "without", "string": "Weitere Tourentipps", "found": true}]}
{"file": "ultimahora.com-apelacion.html", "url": "https://www.ultimahora.com/tribunal-apelacion-confirma-la-ejecucion-la-condena-la-secretaria-vip-n2999922.html", "text_len": 4021, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "la Corte Suprema de Justicia,", "found": true}, {"type": "with", "string": "el pedido y esto fue apelado por la defensa", "found": true}, {"type": "with", "string": "de honorarios a 23 meses con la suspensi\u00f3n", "found": true}, {"type": "without", "string": "Asunci\u00f3n: Tras ola", "found": false}, {"type": "without", "string": " marihuana que", "found": false}, {"type": "without", "string": "Dej\u00e1 tu comentario", "found": false}]}
{"file": "phys.org.tool.html", "url": "https://phys.org/news/2019-10-flint-flake-tool-partially-birch.html", "text_len": 2204, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Prior work has turned up", "found": true}, {"type": "with", "string": "the North Sea for most of its existence", "found": true}, {"type": "without", "string": "Explore further", "found": false}, {"type": "without", "string": "Feedback to editors", "found": false}, {"type": "without", "string": "the very first glue", "found": false}]}
{"file": "elperuanoa.pe-logran.html", "url": "https://elperuano.pe/noticia/152832-logran-evacuar-a-otros-50-civiles", "text_len": 560, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "ni\u00f1os y ancianos\u201d, inform\u00f3 la", "found": false}, {"type": "with", "string": "se iniciaron el fin de semana pasado y", "found": false}, {"type": "with", "string": "el cese el fuego, por lo", "found": false}, {"type": "without", "string": "Algunos se acuerdan de su madre", "found": false}, {"type": "without", "string": "(05:45) Senamhi: DANA \u201cBernardo\u201d", "found": false}, {"type": "without", "string": "Ser madre en el Per\u00fa", "found": false}]}
{"file": "hassanchef.com.bhindi.html", "url": "https://www.hassanchef.com/2020/09/bhindi-masala-okra-stir-fry.html", "text_len": 6822, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Tandoori roti, Naan and paratha are also served with this masala.", "found": true}, {"type": "with", "string": "You can many popular dishes with bhindi like", "found": true}, {"type": "with", "string": "My wife only use red chilli powder", "found": true}, {"type": "without", "string": "Copyright \u00a9 Hassanchef 2020", "found": false}, {"type": "without", "string": "Post a Comment", "found": false}, {"type": "without", "string": "You might like", "found": false}]}
{"file": "homify.de-Tischdecke.html", "url": "https://www.homify.de/diy/20546/wie-man-eine-runde-tischdecke-in-nur-7-schritten-herstellt", "text_len": 144, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Unabh\u00e4ngig von Gr\u00f6\u00dfe und Stil kannst du", "found": false}, {"type": "with", "string": "den Durchmesser (das ist das Ma\u00df,", "found": false}, {"type": "with", "string": "wie du eine runde Tischdecke", "found": false}, {"type": "without", "string": "Kommentare", "found": false}, {"type": "without", "string": "Die Seedball Manufaktur", "found": false}, {"type": "without", "string": "Ern\u00e4hrungsworkshop", "found": false}]}
{"file": "france.attc.org-privatisations.html", "url": "https://france.attac.org/actus-et-medias/dans-les-medias/article/les-privatisations-sont-au-profit-d-interets-prives-financiers-des", "text_len": 388, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Aur\u00e9lie Trouv\u00e9, porte-parole", "found": true}, {"type": "with", "string": "partag\u00e9 pour emp\u00eacher", "found": true}, {"type": "with", "string": " pour parler du", "found": true}, {"type": "without", "string": "Dans la m\u00eame rubrique", "found": false}, {"type": "without", "string": "Je fais un don \u00e0 Attac", "found": false}, {"type": "without", "string": "Abandon du projet", "found": false}]}
{"file": "KATAPULT-Magazin.de-parteien.html", "url": "https://katapult-magazin.de/de/artikel/anzahl-zugelassener-parteien", "text_len": 644, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "es zu viele sind und viele auch nur", "found": true}, {"type": "with", "string": "in wenigen Bundesl\u00e4ndern mit einer Landesliste antreten", "found": true}, {"type": "with", "string": "haben wir uns auf die gr\u00f6\u00dften beschr\u00e4nkt.", "found": true}, {"type": "without", "string": "Neueste Artikel", "found": false}, {"type": "without", "string": "Rechte in MV n\u00f6tigen KATAPULT", "found": false}, {"type": "without", "string": "Rechte, Rechtsextreme und Querdenker aus MV versuchen, KATAPULT einzusch\u00fcchtern. Mit erstem Erfolg. Die Lage ist kritisch. Wir wollen das nicht hinnehmen.", "found": false}]}
{"file": "archive.org.bewegliche-lettern.de.typography.html", "url": "https://web.archive.org/web/20160218174457/http://bewegliche-lettern.de/2010/05/literatur-und-animated-typography/", "text_len": 917, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ich schlage darin vor, in der Remix-Kunst der Animated Typography ein Beispiel daf\u00fcr zu sehen", "found": true}, {"type": "with", "string": "und der Literatur vielleicht besonders gerechte", "found": true}, {"type": "without", "string": "Lesenswert: Interview \u00fcber Google Editions in Deutschland", "found": false}, {"type": "without", "string": "Comments are closed.", "found": false}, {"type": "without", "string": "Alle redaktionellen Eigenbeitr\u00e4ge", "found": false}]}
{"file": "security.googleblog.com.protection.html", "url": "https://security.googleblog.com/2020/05/enhanced-safe-browsing-protection-now.html", "text_len": 3822, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "ve seen threats on the web becoming increasingly sophisticated", "found": true}, {"type": "with", "string": "This protocol is designed so that Google cannot", "found": true}, {"type": "with", "string": "billions of users are incredibly diverse, with", "found": true}, {"type": "without", "string": "Give us feedback in our", "found": false}, {"type": "without", "string": "Google Privacy Terms ", "found": false}, {"type": "without", "string": "insights from Google on security and safety on the Internet", "found": false}]}
{"file": "hellogiggles.com.skin.html", "url": "https://hellogiggles.com/beauty/dead-skin-cells-build-up/", "text_len": 5698, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Admit it: Ever since the first rough, grainy glob", "found": true}, {"type": "with", "string": "exfoliating acids, you kind of owe them an apology.", "found": true}, {"type": "with", "string": "Desquamation can only take place when the skin is functioning", "found": true}, {"type": "without", "string": "adhere to in the morning and at night.", "found": false}, {"type": "without", "string": "two makeup artists to get their top tips on how to extend", "found": false}, {"type": "without", "string": "spots caused by melasma, sun damage, or pigmentation", "found": false}]}
{"file": "schweizerjaeger.ch-steinkauz.html", "url": "https://schweizerjaeger.ch/aktuell/vogeldesjahres2021.html", "text_len": 4933, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Botschafter f\u00fcr eine \u00d6kologische", "found": true}, {"type": "with", "string": "Mittelland und Jura in fast", "found": true}, {"type": "with", "string": "aber auch Hecken und", "found": true}, {"type": "without", "string": "WEITERE INTERESSANTE INFORMATIONEN", "found": false}, {"type": "without", "string": "Wildtiere & Lebensr\u00e4ume im Wandel der Zeit", "found": false}, {"type": "without", "string": "Vogel des Jahres 2022: Feldlerche", "found": false}]}
{"file": "macwelt.de-warten.html", "url": "https://www.macwelt.de/ratgeber/iPhone-14-Warum-sich-das-Warten-wirklich-lohnt-11153570.html", "text_len": 10719, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Unternehmen auf Features, die wir durchaus", "found": true}, {"type": "with", "string": "Frontkamera setzen, wie der Experte Ross Young", "found": true}, {"type": "with", "string": "Eine Periskop-Kamera findet sich bereits", "found": true}, {"type": "without", "string": "Shopping24 Angebot", "found": false}, {"type": "without", "string": "Eine kleine runde Aussparung f\u00fcr die Facetime-Kamera", "found": false}, {"type": "without", "string": "Eine kleine runde Aussparung", "found": false}]}
{"file": "Tageswoche.ch-weg.html", "url": "https://tageswoche.ch/gesellschaft/wir-sind-dann-mal-weg-und-dieser-titel-muss-auch-weg-oder/index.html", "text_len": 4724, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Sportredaktor Samuel ist es nach etwas Dramatik", "found": true}, {"type": "with", "string": "singt er halblaut, aber mit Leidenschaft hinter seinem Bildschirm", "found": true}, {"type": "with", "string": "seufzt Catherine eine Pult-Insel entfernt", "found": true}, {"type": "without", "string": "N\u00e4chster Artikel", "found": false}, {"type": "without", "string": "Liebe Verkehrspolitiker, traut euch bitte endlich was!", "found": false}, {"type": "without", "string": "Parkplatzgeb\u00fchren, Fahrverbote, Velowege", "found": false}]}
{"file": "sladisworld.wordpress.com.sigma.html", "url": "https://sladisworld.wordpress.com/2019/12/10/was-wurde-eigentlich-aus-six-sigma/", "text_len": 8574, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Herr Kieser, \u00e4ltere Menschen erinnern sich", "found": true}, {"type": "with", "string": "Was war der zweite Grund?", "found": true}, {"type": "with", "string": "Man muss das n\u00fcchtern sehen", "found": true}, {"type": "without", "string": "Enter your email address to follow", "found": false}, {"type": "without", "string": "Bloggen auf WordPress.com.", "found": false}, {"type": "without", "string": "\u2026through the looking glass\u2026", "found": false}]}
{"file": "archive.org.juergenheitmann.com.aggression.html", "url": "https://web.archive.org/web/20171008220355/http://juergenheitmann.com/essays/2017/01/aggression-fotografie/", "text_len": 3092, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\"To photograph people is to violate them\"", "found": true}, {"type": "with", "string": "in vergangenen Kulturen und unserer aktuellen Gesellschaft (70er Jahre)", "found": true}, {"type": "with", "string": "welche alternativen Ausdr\u00fccke die empfangenden Haltung", "found": true}, {"type": "without", "string": "View all essays by tag", "found": false}, {"type": "without", "string": "#kontemplativ", "found": false}, {"type": "without", "string": "Mindfulness und kontemplative Fotografie", "found": false}]}
{"file": "aerobuzz.de-bremen.html", "url": "https://aerobuzz.de/militar/cae-bildet-kuenftig-luftwaffen-piloten-in-bremen-aus/", "text_len": 2198, "tp": 2, "fn": 1, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "GmbH hat sich bei der Ausschreibung", "found": false}, {"type": "with", "string": "Bremen am Flughafen ein neues Trainingszentrum", "found": true}, {"type": "with", "string": "Industriepartner die Flugzeuge und die", "found": true}, {"type": "without", "string": "Schon gelesen?", "found": true}, {"type": "without", "string": "Die CAE GmbH wird Nachwuchspiloten", "found": false}, {"type": "without", "string": "Luftwaffe hat mit dem Training auf den H145 von NHV begonnen", "found": true}]}
{"file": "finanzcheck.de.finanzierung.html", "url": "https://www.finanzcheck.de/autokredit/leasing-oder-finanzierung/", "text_len": 13429, "tp": 5, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Im Vergleich zum Leasing geh\u00f6rt bei der Finanzierung das Fahrzeug am Ende dem Halter", "found": true}, {"type": "with", "string": "auch die Leasingraten senken, indem die Kunden eine Anzahlung leisten.", "found": true}, {"type": "with", "string": "Leasingvertr\u00e4ge erstrecken sich meist", "found": true}, {"type": "with", "string": "Effektiver Jahreszins: 3,9 Prozent", "found": true}, {"type": "with", "string": "h\u00f6heres Verschlei\u00dfrisiko aufgrund einer l\u00e4ngeren Nutzungsdauer", "found": true}, {"type": "without", "string": "Gemeinsam finden wir Ihren passenden Kredit!", "found": false}, {"type": "without", "string": "0,00% fester Sollzins", "found": false}, {"type": "without", "string": "3737 Bewertungen", "found": false}]}
{"file": "diem25.org.climate.html", "url": "https://diem25.org/the-eus-green-deal-isnt-enough-save-from-climate-catastrophe/", "text_len": 5763, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Due to the rise of movements dedicated to addressing", "found": true}, {"type": "with", "string": "The Green New Deal for Europe is the most", "found": true}, {"type": "with", "string": "To answer this question, the starting point should", "found": true}, {"type": "without", "string": "Democracy in Europe Movement 2025", "found": false}, {"type": "without", "string": "Do you want to be informed of DiEM25", "found": true}, {"type": "without", "string": "empower workers on an unprecedented scale.", "found": false}]}
{"file": "aclu.org-grades.html", "url": "https://www.aclu.org/blog/juvenile-justice/school-prison-pipeline/county-criminalized-students-bad-grades-until-now", "text_len": 4496, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "criminal justice system.", "found": true}, {"type": "with", "string": "more than a decade", "found": true}, {"type": "with", "string": "many areas of juvenile", "found": true}, {"type": "without", "string": "Fight for everyone's rights", "found": false}, {"type": "without", "string": "RELATED STORIES", "found": false}, {"type": "without", "string": "of Our Students", "found": false}]}
{"file": "hoy.com-daran.html", "url": "https://www.hoy.com.py/nacionales/daran-bendicion-a-vehiculos-este-sabado", "text_len": 10262, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "a ocasi\u00f3n tambi\u00e9n para entregar una", "found": true}, {"type": "with", "string": "cuidado que se debe tener con respecto a la", "found": true}, {"type": "with", "string": "Hermanos Franciscanos Capuchinos realizar\u00e1n", "found": true}, {"type": "without", "string": "Etiquetas:", "found": false}, {"type": "without", "string": "La bendici\u00f3n se realizar\u00e1 ma\u00f1ana. Foto: LN", "found": false}, {"type": "without", "string": "Beb\u00e9 muere electrocutado al", "found": true}]}
{"file": "unocero.com.marcas.html", "url": "https://www.unocero.com/smartphones/marcas-mala-gestion-apps-segundo-plano-android/", "text_len": 2672, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "pues al hacer esto se gastaba mucha", "found": true}, {"type": "with", "string": "El problema es que a pesar de que", "found": true}, {"type": "with", "string": "convierten en una desventaja para la experiencia de uso.", "found": true}, {"type": "without", "string": "y te enviaremos un correo diario con lo", "found": false}, {"type": "without", "string": "Derechos Reservados. unocero es una", "found": false}, {"type": "without", "string": "Modo Nocturno", "found": false}]}
{"file": "german.stackexchange.com.ausgeraubt.html", "url": "https://german.stackexchange.com/questions/10376/when-to-use-wurde-versus-war-eg-ich-wurde-ausgeraubt-vs-ich-war-ausgerau", "text_len": 1073, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "How does one know", "found": false}, {"type": "with", "string": "Ich wurde ausgeraubt", "found": false}, {"type": "with", "string": "in that context", "found": false}, {"type": "without", "string": "2 months ago", "found": false}, {"type": "without", "string": "20:37", "found": false}, {"type": "without", "string": "Sorted by", "found": false}]}
{"file": "pluralsight.com.python.html", "url": "https://www.pluralsight.com/tech-blog/managing-python-environments/", "text_len": 28241, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "self-contained = deployable", "found": true}, {"type": "with", "string": "<config files>", "found": true}, {"type": "without", "string": "21 minutes", "found": false}, {"type": "without", "string": "Tags:", "found": false}]}
{"file": "foxyfolksy.com.buttercream.html", "url": "https://www.foxyfolksy.com/chocolate-buttercream-frosting-without-powdered-sugar-ermine-icing/", "text_len": 17446, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Try this Chocolate Buttercream Frosting. No powdered sugar", "found": true}, {"type": "with", "string": "Combine and sift together the flour, sugar, salt", "found": true}, {"type": "with", "string": "work but definitely easier than Swiss Meringue Frosting", "found": true}, {"type": "without", "string": "Send me email every new post.", "found": false}, {"type": "without", "string": "Receive new posts directly delivered to your inbox", "found": false}, {"type": "without", "string": "miss a post. Get updates directly to your inbox ", "found": false}]}
{"file": "en.wikipedia.org.tsne.html", "url": "https://en.wikipedia.org/wiki/T-distributed_stochastic_neighbor_embedding", "text_len": 7203, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Given a set of high-dimensional objects", "found": true}, {"type": "with", "string": "Herein a heavy-tailed Student t-distribution", "found": true}, {"type": "without", "string": "Categories:", "found": false}, {"type": "without", "string": "Conditional random field", "found": false}]}
{"file": "travanto.de.ferienhaus-feinen.html", "url": "https://www.travanto.de/ferienhaus/lierfeld/40222/ferienhaus-feinen.php", "text_len": 5143, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wir haben unser altes Bauernhaus zu einem", "found": true}, {"type": "with", "string": "Das idyllische Eifeld\u00f6rfchen Lierfeld liegt", "found": true}, {"type": "with", "string": "Kinder unter 4 Jahren werden nicht als", "found": true}, {"type": "without", "string": "Travanto Buchungshotline", "found": false}, {"type": "without", "string": "tolle Gewinnspiele", "found": false}, {"type": "without", "string": " TrustScore 4.2 580 Bewertungen", "found": false}]}
{"file": "bmwi.de-neubau.html", "url": "https://www.bmwi.de/Redaktion/DE/Meldung/2022/20220124-foerderung-fur-energieeffiziente-gebaude-durch-kfw.html", "text_len": 5829, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": " EH55 Neubauf\u00f6rderung hat", "found": true}, {"type": "with", "string": "wieder aufgenommen, sobald", "found": true}, {"type": "with", "string": "\u00dcber die Zukunft der Neubauf\u00f6rderung", "found": true}, {"type": "without", "string": "Verwandte Themen", "found": false}, {"type": "without", "string": "Europ\u00e4ische und internationale Energiepolitik", "found": false}, {"type": "without", "string": "MEDIENRAUM", "found": false}]}
{"file": "motorsport-magazin.com-alphatauri.html", "url": "https://www.motorsport-magazin.com/formel1/news-275350-formel-1-fahrercheck-alphatauri-das-koennen-pierre-gasly-yuki-tsunoda-f1-2022/", "text_len": 4195, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "beginnt das Jahr mit einem Fahrer-Formcheck", "found": true}, {"type": "with", "string": "Fehltritte ein, die hin und wieder auch gro\u00dfe Konsequenzen haben.", "found": true}, {"type": "with", "string": "zeigt, ist, dass er gelegentlich Gefahr", "found": true}, {"type": "without", "string": "Formel 1 - Pierre Gasly", "found": false}, {"type": "without", "string": "mischt Top-Teams", "found": false}, {"type": "without", "string": "Motorsport-Magazin.com Redakteur", "found": false}]}
{"file": "helmholtz-klima.de.kipppunkt.html", "url": "https://www.helmholtz-klima.de/aktuelles/kein-kipppunkt-zugunsten-des-klimaschutzes", "text_len": 6546, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u201eDie multilaterale Diplomatie", "found": true}, {"type": "with", "string": "Der Fonds hat", "found": true}, {"type": "with", "string": "Christoph Bals von der Umweltorganisation", "found": true}, {"type": "without", "string": "MEHR ZUM THEMA", "found": false}, {"type": "without", "string": "NEWSLETTERANMELDUNG", "found": false}, {"type": "without", "string": "AUF DEM LAUFENDEN BLEIBEN!", "found": false}]}
{"file": "arbeit-und-arbeitsrecht.de.urlaub.html", "url": "https://www.arbeit-und-arbeitsrecht.de/news/verjaehrung-von-urlaubsanspruechen.html", "text_len": 4407, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Der Beklagte besch\u00e4ftigte", "found": true}, {"type": "with", "string": "Der Senat hat damit die", "found": true}, {"type": "with", "string": "Pressemitteilung Nr. 48/22", "found": true}, {"type": "without", "string": "Jetzt zum kostenlosen Newsletter anmelden", "found": false}, {"type": "without", "string": "Recherche im Archiv", "found": false}, {"type": "without", "string": "Redaktions-Newsletter", "found": false}]}
{"file": "Eurostat_ Polska z najni\u017cszym bezrobociem w ca\u0142ej UE.html", "url": "https://dorzeczy.pl/ekonomia/183131/eurostat-polska-z-najnizszym-bezrobociem-w-calej-ue.html", "text_len": 1575, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wyr\u00f3wnana sezonowo stopa", "found": true}, {"type": "with", "string": "Holandia (3,5 proc.).", "found": true}, {"type": "with", "string": "najni\u017csza w UE \u2013 poda\u0142 Eurostat.", "found": false}, {"type": "without", "string": "Praca w magazynie", "found": false}, {"type": "without", "string": "\u0179r\u00f3d\u0142o:", "found": false}, {"type": "without", "string": "NAJNOWSZE", "found": false}]}
{"file": "fluessiggas.de.dimethylether.html", "url": "https://fluessiggas.de/aktuelles/dimethylether/", "text_len": 1590, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Nachfrage nach erneuerbaren Energien", "found": false}, {"type": "with", "string": "Verbraucher in Deutschland k\u00f6nnen bereits", "found": false}, {"type": "with", "string": "Die Aussicht, dass erneuerbarer Dimethylether", "found": false}, {"type": "without", "string": "Verwandte Themenbereiche", "found": false}, {"type": "without", "string": "Highlights aus dem Bereich:", "found": false}, {"type": "without", "string": "Beitrag teilen", "found": false}]}
{"file": "bunterepublik.wordpress.com.talstrasse.html", "url": "https://bunterepublik.wordpress.com/2017/06/12/keine-spiel-talstrasse-zur-bunten-republik-neustadt/", "text_len": 1791, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Zur Bunten Republik Neustadt 2017", "found": true}, {"type": "with", "string": "Zur Bunten Republik Neustadt 2017", "found": true}, {"type": "with", "string": "Zur Bunten Republik Neustadt 2017", "found": true}, {"type": "without", "string": "Abgelegt unter Aktuelles", "found": false}, {"type": "without", "string": "Der Inhalt dieser Seite steht", "found": false}, {"type": "without", "string": "Bloggen auf WordPress.com", "found": false}]}
{"file": "arsnova.thm.de.frag.html", "url": "https://arsnova.thm.de/blog/frag-jetzt/", "text_len": 2688, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "live moderierbar", "found": true}, {"type": "with", "string": "einen Workshop an", "found": true}, {"type": "with", "string": "im H\u00f6rsaal Fragen", "found": true}, {"type": "without", "string": "ARSnova-Workshop an der Uni Wien", "found": false}, {"type": "without", "string": "wird nicht ver\u00f6ffentlicht", "found": false}, {"type": "without", "string": "Technische Hochschule Mittelhessen", "found": false}]}
{"file": "1337kultur.de.picard.html", "url": "https://1337kultur.de/2020/folge-70-star-trek-picard/", "text_len": 1760, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Thema dieser Folge ist", "found": false}, {"type": "with", "string": "f\u00fcnften Episode der", "found": false}, {"type": "with", "string": "Wir werden spoilern", "found": true}, {"type": "without", "string": "Leet-Kultur \u2013 Kultur aus der Nerdperspektive", "found": false}, {"type": "without", "string": "Hohe Qualit\u00e4t Livestream in hoher Qualit\u00e4t (128 kbit/s)", "found": false}, {"type": "without", "string": "Lizenz des Podcasts", "found": false}]}
{"file": "nhk.or.jp.k100.html", "url": "https://www3.nhk.or.jp/news/easy/k10011959621000/k10011959621000.html", "text_len": 372, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u5b50\u3069\u3082\u3078\u306e\u8650\u5f85\u3092\u306a\u304f\u3059\u305f\u3081\u306e\u6cd5\u5f8b\u304c\u3067\u304d\u3066\u3001\u89aa\u304c\u5b50\u3069\u3082\u3092\u6559\u80b2\u3059\u308b\u305f\u3081\u306b\u3001", "found": true}, {"type": "with", "string": "\u6cd5\u5f8b\u3067\u306f\u8650\u5f85\u3092\u3057\u305f\u89aa\u306b\u5c02\u9580\u5bb6\u304c\u5b50\u3069\u3082\u306e\u80b2\u3066\u65b9\u3092", "found": true}, {"type": "with", "string": "\u8650\u5f85\u3057\u305f\u3068\u304d\u306b\u53f1\u3063\u3066\u3044\u305f\u3060\u3051\u3060\u3068\u8a00\u3046\u89aa\u304c\u3044\u307e\u3059\u3002\u65b0\u3057\u3044\u6cd5\u5f8b\u3067\u306f", "found": true}, {"type": "without", "string": "\u203b\u4e0b\u306b\u7dda\u304c\u3042\u308b\u3053\u3068\u3070\u306f\u8f9e\u66f8\u306e\u8aac\u660e\u3092\u898b\u308b\u3053\u3068\u304c\u3067\u304d\u307e\u3059\u3002 ", "found": false}, {"type": "without", "string": "\u304f\u8ee2\u8f09\u3059\u308b\u3053\u3068\u3092\u7981\u3058\u307e\u3059\u3002\u3053\u306e\u30da\u30fc\u30b8\u306f\u53d7\u4fe1\u6599\u3067\u5236\u4f5c\u3057\u3066\u3044\u307e\u3059\u3002", "found": false}, {"type": "without", "string": "Copyright NHK (Japan Broadcasting Corporation).", "found": false}]}
{"file": "bfn.de-verden.html", "url": "https://www.bfn.de/pressemitteilungen/allervielfalt-verden-bringt-natur-die-aller-zurueck", "text_len": 4611, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "5,1 Millionen Euro f\u00fcr die erste F\u00f6rderphase", "found": false}, {"type": "with", "string": "Interessen von Landwirtschaft und", "found": true}, {"type": "with", "string": "einer gemeinsamen Initiative von", "found": true}, {"type": "without", "string": "Weiterf\u00fchrende Informationen", "found": false}, {"type": "without", "string": "Das Projektgebiet an der Aller", "found": false}, {"type": "without", "string": "Bundesprogramm \u201eBlaues Band Deutschland\u201c", "found": false}]}
{"file": "couchstyle.de.vintage.html", "url": "https://www.couchstyle.de/living/homestory/vintage-flair-mit-sehr-viel-gruen--1597", "text_len": 401, "tp": 2, "fn": 1, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Vintage trifft Urban Jungle", "found": true}, {"type": "with", "string": "Am alten K\u00fcchentisch", "found": true}, {"type": "with", "string": "Der Barschrank aus den 50er Jahre", "found": false}, {"type": "without", "string": "Entdecke weitere Homestorys", "found": true}, {"type": "without", "string": "Community", "found": true}, {"type": "without", "string": "Abo", "found": false}]}
{"file": "publimetro.cl-ministra.html", "url": "https://www.publimetro.cl/noticias/2022/05/04/ministra-de-la-mujer-por-berrios-que-la-justicia-penal-investigue-no-la-canonica/", "text_len": 2169, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "a la denuncia que recae en contra", "found": true}, {"type": "with", "string": "en declaraciones a T13 Noche.", "found": true}, {"type": "with", "string": "mayor celeridad posible\u201d, a\u00f1adi\u00f3.", "found": true}, {"type": "without", "string": "S\u00edguenos en", "found": false}, {"type": "without", "string": "LO \u00daLTIMO", "found": false}, {"type": "without", "string": "\u201cNos pill\u00f3 de sorpresa\u201d", "found": false}]}
{"file": "Ostbelgiendirekt.be-ARD-Doku.html", "url": "https://ostbelgiendirekt.be/tv-tipp-loriot-100-367167", "text_len": 5352, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die ARD hat f\u00fcr ihre Mediathek", "found": true}, {"type": "with", "string": "eine umfangreiche Schau mit Loriots bekanntesten Werken", "found": true}, {"type": "with", "string": "Das Widget mit den ikonischen Sketch- und Cartoon-Klassikern von SWR", "found": true}, {"type": "without", "string": "Popul\u00e4re Artikel der letzten 7 Tage", "found": false}, {"type": "without", "string": "Aktuelle Kommentare", "found": false}, {"type": "without", "string": "Alles nur Satire", "found": false}]}
{"file": "gartenjournal.net-Zaubernuss.html", "url": "https://www.gartenjournal.net/zaubernuss-im-winter", "text_len": 1799, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "filigrane Bl\u00fcten mit bis zu 4 cm", "found": true}, {"type": "with", "string": "bevor der Wurzelballen austrocknet", "found": true}, {"type": "with", "string": "keine besondere Winterpflege n\u00f6tig", "found": true}, {"type": "without", "string": "Hier weiterlesen", "found": false}, {"type": "without", "string": "Wie gro\u00df wird die", "found": false}, {"type": "without", "string": "Lesen Sie auch", "found": false}]}
{"file": "wolfgangschmale.eu.duchhardt.html", "url": "https://wolfgangschmale.eu/abgebrochene-forschung-eine-neue-studie-von-heinz-duchhardt/", "text_len": 8991, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "[1] Wer im Wissenschaftsbetrieb w\u00fcrde", "found": true}, {"type": "with", "string": "Band zwei alsbald folgen zu lassen", "found": true}, {"type": "with", "string": "[8] Historiker oder Geschichte als Fach", "found": true}, {"type": "without", "string": "Wenn Sie diesen Blogeintrag kommentieren", "found": false}, {"type": "without", "string": "Diese Website verwendet Akismet", "found": false}, {"type": "without", "string": "Neueste Kommentare", "found": false}]}
{"file": "blog.wordpress.com.diverse.html", "url": "https://en.blog.wordpress.com/2019/06/19/want-to-see-a-more-diverse-wordpress-contributor-community-so-do-we/", "text_len": 3634, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Why WordCamps?", "found": true}, {"type": "with", "string": "which makes WordPress better for more people.", "found": true}, {"type": "with", "string": "Get in touch with Jill", "found": true}, {"type": "without", "string": "Missing out on the latest", "found": false}, {"type": "without", "string": "Opens in new window", "found": false}, {"type": "without", "string": "Jill Binder, speaking at a WordCamp", "found": false}]}
{"file": "d32ad974a4b04657bb6e4d91852bd52d.html", "url": "https://www.tichyseinblick.de/kolumnen/spahns-spitzwege/no-peace-for-our-time-pence-syrien-und-die-tuerkei/", "text_len": 15023, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "war 1938 der Auftakt zur bisher gr\u00f6\u00dften", "found": true}, {"type": "with", "string": "Frieden in unserer Zeit?", "found": true}, {"type": "with", "string": "Au\u00dfer Kuscheleinheiten nichts gewesen.", "found": true}, {"type": "without", "string": "T\u00e4glich schreiben unabh\u00e4ngige", "found": false}, {"type": "without", "string": "Unterst\u00fctzen Sie diese Form", "found": false}, {"type": "without", "string": "T\u00fcrkei: Der euroamerikanische Abschied aus der Weltpolitik", "found": false}]}
{"file": "next2games.de.anno.html", "url": "https://next2games.de/previews,id1085,0,anno_1800_beta.html", "text_len": 7283, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "zu entdecken, was Anno 1800 noch in petto h\u00e4lt.", "found": true}, {"type": "with", "string": "Neben dem Startgebiet in einer klimatisch eher gem\u00e4\u00dfigten", "found": true}, {"type": "with", "string": "Wie in jedem Titel der mittlerweile \u00fcber 20 Jahre", "found": true}, {"type": "without", "string": "n2g media network", "found": false}, {"type": "without", "string": "CMS: Apexx by Stylemotion", "found": false}, {"type": "without", "string": "Diese Website nutzt Cookies", "found": false}]}
{"file": "motor.at-elektroroller.html", "url": "https://motor.at/zweirad/seat-mo-125-der-elektroroller-im-test/401755605", "text_len": 3270, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Der (Elektro-)Roller versteht", "found": true}, {"type": "with", "string": "Mo 125 auf 95 km/h", "found": true}, {"type": "with", "string": "man noch die F\u00f6rderung", "found": true}, {"type": "without", "string": "Kommentare gepostet", "found": false}, {"type": "without", "string": "motor.at, and", "found": false}, {"type": "without", "string": "Bild: Werk/CHRISTIAN HOUDEK", "found": false}]}
{"file": "elenacional.com-carta.html", "url": "https://www.elnacional.com/venezuela/carta-abierta-un-nuevo-espacio-donde-el-nacional-recibira-las-denuncias-de-sus-lectores/", "text_len": 1244, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u00abQueremos contar las historias desde", "found": true}, {"type": "with", "string": "gente, crear v\u00ednculos y sobre todo", "found": true}, {"type": "with", "string": "voz del venezolano\u00bb, resalt\u00f3 Makriniotis.", "found": true}, {"type": "without", "string": "El Nacional recibir\u00e1 cartas", "found": false}, {"type": "without", "string": "MINUTO A MINUTO", "found": false}, {"type": "without", "string": "desapariciones forzadas en Brasil", "found": false}]}
{"file": "rs-ingenieure.de.tragwerksplanung.html", "url": "http://www.rs-ingenieure.de/de/hochbau/leistungen/tragwerksplanung", "text_len": 437, "tp": 1, "fn": 0, "fp": 0, "tn": 1, "details": [{"type": "with", "string": "Wir bearbeiten alle Leistungsbilder", "found": true}, {"type": "without", "string": "Br\u00fcckenbau", "found": false}]}
{"file": "d43f330cbaf74e92b9aec85e937cb904.html", "url": "https://www.mactechnews.de/forum/discussion/kein-App-Store-mehr-ueber-Mobile-Daten-mit-iOS-13--338679.html.html", "text_len": 14584, "tp": 2, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "one 11 und xs und ipads sind keinen zugriff mehr auf den appstore", "found": true}, {"type": "with", "string": "und bevor wieder die \u00fcbliche h\u00e4me", "found": true}, {"type": "without", "string": "Kommentieren", "found": true}, {"type": "without", "string": "Sie m\u00fcssen sich einloggen, um sich an einer Diskussion beteiligen zu k\u00f6nnen.", "found": false}, {"type": "without", "string": "wo immer es sinnvoll erscheint. Sie unterst\u00fctzen", "found": false}]}
{"file": "archive.org.przepisy.pl.pierogi.html", "url": "https://web.archive.org/web/20200808063632/https://www.przepisy.pl/przepis/pierogi-z-dynia-w-sosie-szalwiowym", "text_len": 2787, "tp": 3, "fn": 0, "fp": 3, "tn": 0, "details": [{"type": "with", "string": "ugotowane pierogi, chwil\u0119 wymieszaj i natychmiast podawaj.", "found": true}, {"type": "with", "string": "Przyprawa w Mini kostkach Sma\u017cona cebula", "found": true}, {"type": "with", "string": "Przygotowanie krok po kroku", "found": true}, {"type": "without", "string": "S\u0142odkie i soczyste owoce, kt\u00f3re mog\u0105 by\u0107", "found": true}, {"type": "without", "string": "si\u0119 do niego warzywa, sery, mi\u0119so, zio\u0142a. Skorzystaj z", "found": true}, {"type": "without", "string": "To naprawd\u0119 pyszne danie \u2013 przekonaj si\u0119?", "found": true}]}
{"file": "blinker.de-Rostock.html", "url": "https://www.blinker.de/angelmethoden/angeln-allgemein/news/fishing-masters-show-in-rostock-findet-naechstes-jahr-statt/", "text_len": 2363, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "IGA Park alles ums Angeln drehen.", "found": false}, {"type": "with", "string": "coronabedingten Verschiebungen steht", "found": true}, {"type": "with", "string": "frischem R\u00e4ucherfisch und vielen", "found": true}, {"type": "without", "string": "Das k\u00f6nnte Sie auch interessieren", "found": false}, {"type": "without", "string": "Bild: Jahr Media", "found": false}, {"type": "without", "string": "Wir erstellen Ihr", "found": false}]}
{"file": "seelenradio.de.leo.html", "url": "http://www.seelenradio.de/nummer-zwei-leo/", "text_len": 269, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Es ist schon einige Zeit", "found": true}, {"type": "with", "string": "=)", "found": true}, {"type": "with", "string": "So sah es aus", "found": true}, {"type": "without", "string": "seelenradio is powered by", "found": false}, {"type": "without", "string": "Say your words", "found": false}, {"type": "without", "string": "No Response so far", "found": false}]}
{"file": "ritinardo.wordpress.com.btw17.html", "url": "https://ritinardo.wordpress.com/2017/11/26/bundesregierung-2017-btw17-groko/", "text_len": 5398, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wenn man so h\u00f6rt und liest", "found": true}, {"type": "with", "string": "Deutschland ist ein Land", "found": true}, {"type": "with", "string": "SPD und FDP haben dieses mal vieles", "found": true}, {"type": "without", "string": "Erstelle eine kostenlose Website oder Blog", "found": false}, {"type": "without", "string": "Teilen Sie dies mit:", "found": false}, {"type": "without", "string": "Fall #Amani, was passiert denn da? #aboutyouawards", "found": false}]}
{"file": "pagesix.com.myers.html", "url": "https://pagesix.com/2020/02/24/former-wh-press-secretary-dee-dee-myers-exits-warner-bros-role/", "text_len": 615, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Dee Dee Myers \u2014 a White House press secretary for Bill Clinton", "found": true}, {"type": "with", "string": "\u201cI\u2019m going to take some time to figure out what\u2019s next", "found": true}, {"type": "with", "string": "Her last day is April 1", "found": true}, {"type": "without", "string": "Getty Images", "found": false}, {"type": "without", "string": "Filed under", "found": false}, {"type": "without", "string": "Most Popular This Week", "found": false}]}
{"file": "economictimes.indiatimes.com.slideshow.html", "url": "https://economictimes.indiatimes.com/tech/hardware/the-iphone-se-is-in-india-heres-all-we-know/not-a-flagship/slideshow/76280131.cms", "text_len": 503, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "The latest iPhone from Apple is not what", "found": false}, {"type": "with", "string": "All of this - coupled with better cameras - comes", "found": false}, {"type": "with", "string": "But, the iPhone SE fits in so much more", "found": false}, {"type": "without", "string": "Apple has just updated the 13-inch MacBook Pro", "found": false}, {"type": "without", "string": "for a smoother typing experience, according to Apple.", "found": false}, {"type": "without", "string": "production and sales but new models are still being ", "found": false}]}
{"file": "hausinfo.ch-kondenswasser.html", "url": "https://hausinfo.ch/de/wohnen/wohnen-leben/angenehmes-raumklima/kondenswasser.html", "text_len": 3586, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Fenstern nicht durch \u00fcberstellte Fensterb\u00e4nke", "found": true}, {"type": "with", "string": "Dies schl\u00e4gt sich aber in", "found": true}, {"type": "with", "string": "Luftfeuchtigkeit im Raum sorgen", "found": true}, {"type": "without", "string": "Kondenswasser an den Fensterr\u00e4ndern", "found": true}, {"type": "without", "string": "Angenehmes Raumklima", "found": false}, {"type": "without", "string": "Gesund wohnen", "found": false}]}
{"file": "dtb.de-kulturwandel.html", "url": "https://www.dtb.de/weitere-nachrichten/nachrichten/artikel/massnahmen-umgesetzt-und-kulturwandel-angestossen", "text_len": 12847, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Verantwortlichen Zeit, eine erste Bilanz zu ziehen", "found": true}, {"type": "with", "string": "Pr\u00e4ventions- und Interventionskonzept zum Schutz", "found": true}, {"type": "with", "string": "die Ergebnisse aus verschiedenen Perspektiven", "found": true}, {"type": "without", "string": "Weiterf\u00fchrende Links", "found": false}, {"type": "without", "string": "Kultur- und Strukturwandel im DTB \u2013 ein Zwischenfazit", "found": false}, {"type": "without", "string": "Weitere Informationen hierzu gibt es in K\u00fcrze auf der Website des", "found": true}]}
{"file": "elnuevodia.com-mujeres.html", "url": "https://www.elnuevodia.com/noticias/politica/notas/lider-de-la-organizacion-mujeres-populares-denuncia-intentos-del-ppd-de-silenciarla/", "text_len": 360, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Jos\u00e9 Luis Dalmau relacionadas al aborto", "found": false}, {"type": "with", "string": "posturas p\u00fablicas en contra de la", "found": true}, {"type": "with", "string": "que se han practicado un aborto.", "found": true}, {"type": "without", "string": "Jos\u00e9 Luis Dalmau indica que el", "found": false}, {"type": "without", "string": "Carlos Delgado Altieri", "found": false}, {"type": "without", "string": "Ada \u00c1lvarez Conde anticip\u00f3 que renunciar\u00e1", "found": false}]}
{"file": "github.com.yapapi.html", "url": "https://github.com/golemfactory/yapapi", "text_len": 3766, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Golem application development", "found": true}, {"type": "with", "string": "poetry add yapapi", "found": true}, {"type": "with", "string": "YAGNA_PAYMENT_DRIVER", "found": true}, {"type": "without", "string": "Watchers", "found": false}, {"type": "without", "string": "2022 GitHub", "found": false}, {"type": "without", "string": "Failed to load latest commit information", "found": false}]}
{"file": "bumsbutzener-gumpfen.blogspot.com.tach-auch.html", "url": "https://bumsbutzener-gumpfen.blogspot.com/2020/04/tach-auch.html", "text_len": 6028, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ich h\u00e4tte zwar das ein oder andere Mal noch Lust gehabt, den ein oder ande", "found": true}, {"type": "with", "string": "weck verfolgt, Kranke zu heilen und Brunnen zu bauen.", "found": true}, {"type": "with", "string": "Oder, um es mit Reinhard Mey zu sagen:", "found": true}, {"type": "without", "string": "Dieses Blog durchsuchen", "found": false}, {"type": "without", "string": "Eingestellt von der Michel", "found": false}, {"type": "without", "string": "Nachdem ProSieben mit seinem Auktionshaus", "found": false}]}
{"file": "peppermynta.de-Strickmode.html", "url": "https://peppermynta.de/fashion-guides/fair-fashion-strick-nachhaltige-strickmode-mulesingfrei-knitwear/", "text_len": 14489, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Was w\u00e4re Wintermode ohne kuschelige Knitwear", "found": true}, {"type": "with", "string": "und ist gerade in der konventionellen Tierhaltung oftmals mit viel Tierleid verbunden", "found": true}, {"type": "with", "string": "Fairer Strick Made in Europe", "found": true}, {"type": "without", "string": "Das k\u00f6nnte Dich auch noch interessieren", "found": false}, {"type": "without", "string": "Kennt ihr schon unseren Brandfinder?", "found": true}, {"type": "without", "string": "Studiert im Master European Culture and Economy", "found": false}]}
{"file": "utopia.de-Werbung.html", "url": "https://utopia.de/news/was-haben-bhs-mit-eisbergen-zu-tun-kim-kardashian-polarisiert-mit-werbung-nippel/", "text_len": 4450, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Kim Kardashian hat 2019 die inklusive Shapewear-Marke", "found": true}, {"type": "with", "string": "mitgegr\u00fcndet und macht nun Werbung f\u00fcr ein neues Produkt", "found": true}, {"type": "with", "string": "Auf Instagram erschien vor kurzem ein Spot", "found": true}, {"type": "without", "string": "Aktuelle News", "found": false}, {"type": "without", "string": "Beliebte Beitr\u00e4ge", "found": false}, {"type": "without", "string": "Beliebte Bestenlisten", "found": false}]}
{"file": "iloveponysmag.com.barbour.html", "url": "http://iloveponysmag.com/2018/05/24/barbour-coastal/", "text_len": 4416, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Eine meiner besten Entscheidungen bisher:", "found": true}, {"type": "with", "string": "Verlassenes Gew\u00e4chshaus meets versteckter Deich", "found": true}, {"type": "with", "string": "Der Hundestrand in Stein an der Ostsee", "found": true}, {"type": "without", "string": "Tags: Barbour,", "found": false}, {"type": "without", "string": "Bitte (noch) mehr Bilder von Helle", "found": false}, {"type": "without", "string": "Hinterlasse einen Kommentar", "found": false}]}
{"file": "hearya.com.metal.html", "url": "http://www.hearya.com/2006/12/04/hit-paraders-top-100-metal-vocalists-of-all-time/", "text_len": 2336, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "100. Ray Gillen", "found": true}, {"type": "with", "string": "Keith Caputo, Life of Agony", "found": true}, {"type": "with", "string": "I\u2019m not much of a metal guy these days, but I dabbled", "found": true}, {"type": "without", "string": "Leave a Comment", "found": false}, {"type": "without", "string": "Recent Comments", "found": false}, {"type": "without", "string": "Blogroll", "found": false}]}
{"file": "gregoryszorc.com.python3.html", "url": "https://gregoryszorc.com/blog/2020/01/13/mercurial%27s-journey-to-and-reflections-on-python-3/", "text_len": 39118, "tp": 3, "fn": 0, "fp": 1, "tn": 1, "details": [{"type": "with", "string": "This effort began in earnest", "found": true}, {"type": "with", "string": "Within a few months,", "found": true}, {"type": "with", "string": "Python had a wildly successful past", "found": true}, {"type": "without", "string": "View the discussion thread.", "found": false}, {"type": "without", "string": "January 13", "found": true}]}
{"file": "reiterrevue.de-heulage.html", "url": "https://www.reiterrevue.de/ausbildung-und-praxis/fuetterung/heulage-besser-als-ihr-ruf-12842649.html", "text_len": 2163, "tp": 1, "fn": 2, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Pferdefutter einen weniger guten Ruf.", "found": false}, {"type": "with", "string": ",die die Heulage haltbar machen, die nat\u00fcrli", "found": false}, {"type": "with", "string": "\u201eatmen\u201c und gammelt schnell.", "found": true}, {"type": "without", "string": "Heu ist die Grundlage einer", "found": true}, {"type": "without", "string": "und Schimmelpilze. Was Sie bei", "found": false}, {"type": "without", "string": "DAS PERFEKTE DINNER", "found": false}]}
{"file": "phillyvoice.com-Sixers.html", "url": "https://www.phillyvoice.com/sixers-76ers-score-record-news-analysis-celtics-joel-embiid-tyrese-maxey-jayson-tatum/", "text_len": 5236, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "It was an underwhelming first quarter on both sides", "found": true}, {"type": "with", "string": "as the Sixers and Celtics each struggled mightily to knock down shots", "found": true}, {"type": "with", "string": "The Sixers went 0-for-9 from three-point range in the period", "found": true}, {"type": "without", "string": "Certain personality traits", "found": false}, {"type": "without", "string": "like being an extrovert", "found": false}, {"type": "without", "string": "may lower risk for dementia", "found": false}]}
{"file": "kulinariaathome.com.mandelpl\u00e4tzchen.html", "url": "http://kulinariaathome.wordpress.com/2012/12/08/mandelplatzchen/", "text_len": 744, "tp": 4, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "(+ 15 Minuten backen)", "found": true}, {"type": "with", "string": "200 g Zucker", "found": true}, {"type": "with", "string": "zu einem glatten Teig verarbeiten.", "found": true}, {"type": "with", "string": "Ein Backblech mit Backpapier auslegen.", "found": true}, {"type": "without", "string": "Sharen mit", "found": false}, {"type": "without", "string": "Creative Commons", "found": false}, {"type": "without", "string": "Trotz sorgf\u00e4ltiger inhaltlicher Kontrolle", "found": false}]}
{"file": "gv-bayern.de.portraet.html", "url": "https://www.gv-bayern.de/standard/artikel/der-genossenschaftsverband-bayern-im-portraet-775", "text_len": 1722, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Der Genossenschaftsverband Bayern (GVB) vertritt", "found": true}, {"type": "with", "string": "Wir sind der gesetzliche Pr\u00fcfungsverband", "found": true}, {"type": "with", "string": "unserer Mitglieder und verschaffen ihnen so Geh\u00f6r", "found": true}, {"type": "without", "string": "Meldungen", "found": false}, {"type": "without", "string": "Meist gelesene Beitr\u00e4ge", "found": false}, {"type": "without", "string": "Historischer Verein", "found": false}]}
{"file": "archive.org.time4talks.com.kinos.html", "url": "https://web.archive.org/web/20140226054445/http://www.time4talks.com/2013/08/07/weitere-digitalisierung-der-schweizer-kinos/", "text_len": 739, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Umstellung auf Hightech-Beamer hat n\u00e4mlich kein Kinosterben verursacht", "found": true}, {"type": "with", "string": "Das BAK will mit diesen Beitr\u00e4gen die Digitalisierung", "found": true}, {"type": "with", "string": "Auf 270 Leinw\u00e4nden sind auch 3-D-Filme zu sehen.", "found": true}, {"type": "without", "string": "Bisher keine Kommentare", "found": false}, {"type": "without", "string": "(erforderlich)", "found": false}, {"type": "without", "string": "Nutzen Sie unsere Tools", "found": false}]}
{"file": "verbaende.com.2023.html", "url": "https://www.verbaende.com/news/pressemitteilung/das-aendert-sich-im-jahr-2023-die-wichtigsten-aenderungen-fuer-verbraucherinnen-im-ueberblick-151642/", "text_len": 8324, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "(Leipzig) - Von Preisbremsen", "found": true}, {"type": "with", "string": "Private Solaranlagen:", "found": true}, {"type": "with", "string": "Mehrwegpflicht f\u00fcrs Essen zum Mitnehmen:", "found": true}, {"type": "without", "string": "Weitere Pressemitteilungen dieses Verbands", "found": false}, {"type": "without", "string": "Folgen Sie uns", "found": false}, {"type": "without", "string": "NEWS TEILEN:", "found": false}]}
{"file": "der-farang.com-Grab-Bote.html", "url": "https://der-farang.com/de/pages/frei-erfunden-grab-bote-fliegt-nach-singapur", "text_len": 2564, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "das inzwischen mehr als", "found": true}, {"type": "with", "string": "drei Millionen Aufrufe verzeichnet", "found": true}, {"type": "with", "string": "ist ein thail\u00e4ndischer Grab-Lieferfahrer zu sehen", "found": true}, {"type": "without", "string": "Lesen Sie auch", "found": false}, {"type": "without", "string": "Die Regierung braucht einen Notfallplan: Pita", "found": false}, {"type": "without", "string": "Than On beantragt Thai-ID-Card und Reisepass", "found": false}]}
{"file": "journal.3960.org.firefox.html", "url": "https://journal.3960.org/posts/2019-12-22-firefox-weniger-werbung-mehr-speed-unter-android/", "text_len": 2375, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Werbung nervt. Tracking nervt. Nerven nervt.", "found": true}, {"type": "with", "string": "Von seinem Vorg\u00e4nger unterscheidet", "found": true}, {"type": "with", "string": "nicht von mir benutzter Dienst", "found": true}, {"type": "without", "string": "Zur\u00fcck zur \u00dcbersichtsseite", "found": false}, {"type": "without", "string": "Merkw\u00fcrdige Erlebnisse, spontane Einf\u00e4lle", "found": false}, {"type": "without", "string": "Artikel mit dem Tag \"F\u00fcr Tumblr\"", "found": false}]}
{"file": "wordsmith.org.maudlin.html", "url": "https://wordsmith.org/words/maudlin.html", "text_len": 1434, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "adjective: Overly sentimental", "found": false}, {"type": "with", "string": "derived after a town on the Sea ", "found": true}, {"type": "with", "string": "Jeannette Layne-Clark; Minister on Stage; Daily Nation ", "found": true}, {"type": "without", "string": "spread the magic of words to readers everywhere", "found": false}, {"type": "without", "string": "\u201cA word in the head is worth two in the book.\u201d", "found": false}, {"type": "without", "string": "\u201cA trawl through the site\u2019s archive yields all kinds of delights.\u201d", "found": false}]}
{"file": "de.cointelegraph.com-CME.html", "url": "https://de.cointelegraph.com/news/cme-second-largest-bitcoin-futures-exchange-open-interest-surges", "text_len": 2232, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Chicago Mercantile Exchange (CME)", "found": true}, {"type": "with", "string": "eine regulierte Derivatb\u00f6rse", "found": true}, {"type": "with", "string": "liegt nun in Bezug auf das Open", "found": true}, {"type": "without", "string": "AUCH INTERESSANT", "found": false}, {"type": "without", "string": "CT EMPFIEHLT", "found": false}, {"type": "without", "string": "WERBEN SIE BEI UNS", "found": false}]}
{"file": "citylimits.org-Nycha.html", "url": "https://citylimits.org/2023/11/08/video-voting-on-nychas-future/", "text_len": 3442, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wednesday is a monumental day for the New York City", "found": true}, {"type": "with", "string": "Housing Authority and residents at the Nostrand Houses in Sheepshead Bay, Brooklyn", "found": true}, {"type": "with", "string": "For the first time, tenants will begin to vote", "found": true}, {"type": "without", "string": "LATEST ARTICLES", "found": false}, {"type": "without", "string": "more stories", "found": false}, {"type": "without", "string": "City Limits uses investigative journalism through the prism", "found": false}]}
{"file": "lernpfadprismen.wordpress.com.masse.html", "url": "https://lernpfadprismen.wordpress.com/masse/masse-des-quaders/", "text_len": 4076, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Masse eines K\u00f6rpers", "found": true}, {"type": "with", "string": "L\u00f6sung: m = 210 g", "found": true}, {"type": "with", "string": "Vollst\u00e4ndig durchgerechnete L\u00f6sung", "found": true}, {"type": "without", "string": "Bloggen auf WordPress.com", "found": false}, {"type": "without", "string": "Dieser Lernpfad ist", "found": false}, {"type": "without", "string": "Didaktischer Kommentar", "found": false}]}
{"file": "deleuze.enacademic.com.micropolitics.html", "url": "https://deleuze.enacademic.com/104/micropolitics", "text_len": 7349, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "The orchestration of desire", "found": true}, {"type": "with", "string": "Deleuze and Guattari oppose", "found": true}, {"type": "with", "string": "into itself the \ufb02ows", "found": true}, {"type": "without", "string": "noun The use of formal", "found": true}, {"type": "without", "string": "is professor emeritus of", "found": true}, {"type": "without", "string": "Merleau-Ponty, Maurice", "found": false}]}
{"file": "wolfsrebellen-netz.forumieren.com.regeln.html", "url": "https://wolfsrebellen-netz.forumieren.com/t7-forums-regeln", "text_len": 2832, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wir pflegen hier ein sehr freundschaftliches", "found": true}, {"type": "with", "string": "Grafik, besonders der eigenen", "found": true}, {"type": "with", "string": "gez. Admin lupa", "found": true}, {"type": "without", "string": "Einen Missbrauch melden", "found": false}, {"type": "without", "string": "Widerruf des Lebensversicherungsvertrags vor oder nach", "found": false}, {"type": "without", "string": "Sie sind nicht verbunden", "found": false}]}
{"file": "bayrische-bembel.de.504.html", "url": "http://bayrische-bembel.de/bbr/modules/news/article.php?storyid=504", "text_len": 3237, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Axel Hellmann \u00fcbernimmt die", "found": true}, {"type": "with", "string": "Der Vorsitzende des Aufsichtsrat Wolfgang", "found": true}, {"type": "with", "string": "Saisonende bei Heribert Bruchhagen.", "found": true}, {"type": "without", "string": "Hier geht es zur neuen Vorstandsstruktur", "found": true}, {"type": "without", "string": "Nur f\u00fcr Bembel-Mitglieder", "found": false}, {"type": "without", "string": "Besucher sind online", "found": false}]}
{"file": "spontis.de.jahrzehnt.html", "url": "https://www.spontis.de/schwarze-szene/liebe-leser-bitte-rutschen-sie-nicht-in-das-neue-jahrzehnt/", "text_len": 3699, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wieso eigentlich einen guten", "found": true}, {"type": "with", "string": "Das Lithium-Ionen Akku", "found": true}, {"type": "with", "string": "Sie das neue Jahrzehnt", "found": true}, {"type": "without", "string": "Wizard of Goth", "found": false}, {"type": "without", "string": "Nossi: Belgien: Porta Nigra", "found": false}, {"type": "without", "string": "Soziale Netzwerke", "found": false}]}
{"file": "ihrwebprofi.at.publikumsvoting.html", "url": "https://www.ihrwebprofi.at/2011/09/17/publikumsvoting-beim-wiener-content-award-gestartet/", "text_len": 603, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Beim ContentAward.at, der", "found": true}, {"type": "with", "string": "Die \u201eToilet Map Vienna\u201e, die erste App", "found": true}, {"type": "with", "string": "Das Online-Voting l\u00e4uft von 14. September", "found": true}, {"type": "without", "string": "Kommentar hinzuf\u00fcgen", "found": false}, {"type": "without", "string": "Kategorie: News, open3", "found": false}, {"type": "without", "string": "Derzeit noch keine Kommentare", "found": false}]}
{"file": "harddecor.at.denkmaler.html", "url": "http://harddecor.at/work/denkmaler-neuem-licht/", "text_len": 1532, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "CONDITIONING. of Atmospheres in Architecture", "found": true}, {"type": "with", "string": "Denkmalpflegerinnen, Politikerinnen und der interessierten \u00d6ffentlichkeit f\u00f6rdern.", "found": true}, {"type": "with", "string": "Thema Planen und Bauen in historisch wertvoller Umgebung", "found": true}, {"type": "without", "string": "Best of 2016.", "found": false}, {"type": "without", "string": "Gegen Leerstand und Wertminderung.", "found": false}, {"type": "without", "string": "Mission Statement", "found": false}]}
{"file": "abc13.com-Copperfield.html", "url": "https://abc13.com/aishas-salon-and-spa-houston-lewd-act-man-pleasures-himself-on-camera-harris-county-sheriffs-office/14030671/", "text_len": 3359, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "The Harris County Sheriff's Office is now", "found": true}, {"type": "with", "string": "investigating the incident at the salon chain's location in the Copperfield area.", "found": true}, {"type": "with", "string": "According to the owner, only female stylists are employed there", "found": true}, {"type": "without", "string": "Man admits to taking violating pics of women for months, police say", "found": false}, {"type": "without", "string": "Man was pleasuring himself inside HCC library, woman says", "found": false}, {"type": "without", "string": "Suspects robbed shoe store before chase ended in fiery crash, HPD says", "found": false}]}
{"file": "villagevoice.com-Party.html", "url": "https://www.villagevoice.com/party-like-its-1923-will-donald-trump-write-his-own-mein-kampf-in-jail/", "text_len": 8948, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Trump has been known to contradict himself", "found": true}, {"type": "with", "string": "in depositions, and when being grilled by the New York Attorney", "found": true}, {"type": "with", "string": "office on business fraud charges earlier this year", "found": true}, {"type": "without", "string": "The advertising disclaimer below does not apply to this article", "found": false}, {"type": "without", "string": "nor any originating from the Village Voice editorial department", "found": false}, {"type": "without", "string": "Advertising disclosure: We may receive compensation", "found": false}]}
{"file": "ndr.de.podcastcoronavirus140.html", "url": "https://www.ndr.de/nachrichten/info/16-Coronavirus-Update-Wir-brauchen-Abkuerzungen-bei-der-Impfstoffzulassung,podcastcoronavirus140.html", "text_len": 38095, "tp": 6, "fn": 0, "fp": 0, "tn": 5, "details": [{"type": "with", "string": "Das ist die zweith\u00f6chste von vier Stufen", "found": true}, {"type": "with", "string": "Die zentralen Fragen der Folge im \u00dcberblick", "found": true}, {"type": "with", "string": "Was sagt Professor Drosten dazu?", "found": true}, {"type": "with", "string": "Aus China.", "found": true}, {"type": "with", "string": "On-Off-Mechanismus", "found": true}, {"type": "with", "string": "Gerne. Bis morgen.", "found": true}, {"type": "without", "string": "Regelm\u00e4\u00dfig beantwortet Virus-Forscher", "found": false}, {"type": "without", "string": "Dieses Skript als PDF herunterladen", "found": false}, {"type": "without", "string": "Themen: Kritik aus dem Internet", "found": false}, {"type": "without", "string": "Was Sie zum Coronavirus wissen m\u00fcssen", "found": false}, {"type": "without", "string": "Drucken", "found": false}]}
{"file": "rent-a-salesman.eu.auslagern.html", "url": "https://www.rent-a-salesman.eu/den-vertrieb-auslagern-anders-als-andere-oder-gut-zu-wissen", "text_len": 1344, "tp": 2, "fn": 1, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Einen Vertriebsmitarbeiter ohne", "found": false}, {"type": "with", "string": "Wir wollen auch Provisionen", "found": true}, {"type": "with", "string": "Keine Excel-Sheets - sondern", "found": true}, {"type": "without", "string": "RENT A SALESMAN\u00ae", "found": false}, {"type": "without", "string": "Blog - Tag Cloud", "found": false}]}
{"file": "wildundhund.de-bonn.html", "url": "https://wildundhund.de/bonn-un-konvention-veroeffentlicht-empfehlungen-zur-vogelgrippe-und-zum-umgang-mit-wildvoegeln/", "text_len": 1219, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Arbeitsgruppe zur Vogelgrippe und zu", "found": true}, {"type": "with", "string": "Die CMS stellt fest, dass", "found": true}, {"type": "with", "string": "ungef\u00e4hrlichen Vogelgrippe festzustellen.", "found": true}, {"type": "without", "string": "Russland: Erstmalige Infektion", "found": false}, {"type": "without", "string": "VERWANDTE ARTIKEL", "found": false}, {"type": "without", "string": "NOCH MEHR WILD UND HUND", "found": false}]}
{"file": "biathlonword.com-chinesisch.html", "url": "https://www.biathlonworld.com/de/news", "text_len": 8368, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "kam die chinesische Damenstaffel viermal", "found": true}, {"type": "with", "string": "BMW IBU Weltcupgesamtwertung", "found": true}, {"type": "with", "string": "und eine solide Basis f\u00fcr die Weiterentwicklung", "found": true}, {"type": "without", "string": "BEIJING 2022 - CHINA STORY", "found": false}, {"type": "without", "string": "ABONNIERE UNSEREN NEWSLETTER", "found": false}, {"type": "without", "string": "OLYMPISCHE WINTERSPIELE", "found": false}]}
{"file": "vorangedacht.de.kohleausstieg.html", "url": "https://vorangedacht.de/umwelt-und-klima/ueber-kohleausstieg-kernkraftwerke-und-erneuerbare-energien/", "text_len": 12022, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Bundeswirtschaftsminister Habeck k\u00fcndigte", "found": true}, {"type": "with", "string": "Erneuerbare Energien sind volatil", "found": true}, {"type": "with", "string": "Eine \u00fcberw\u00e4ltigende Mehrzahl der Klimasch\u00fctzer", "found": true}, {"type": "without", "string": "Mehr zum Thema:", "found": false}, {"type": "without", "string": "Zum Newsletter anmelden", "found": true}, {"type": "without", "string": "Gr\u00fcnde f\u00fcr Atomkraftwerke", "found": true}]}
{"file": "resonator-podcast.de.res158.html", "url": "https://resonator-podcast.de/2019/res158-kathrin-goebel/", "text_len": 1795, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Kathrin G\u00f6bel (Twitter) ist", "found": true}, {"type": "with", "string": "Ver\u00f6ffentlicht am 16.08.2019", "found": true}, {"type": "with", "string": "Und bitte entschuldigt den Helium-Fehler ", "found": true}, {"type": "without", "string": "Mit diesem Button kannst Du", "found": true}, {"type": "without", "string": "Der Resonator-Podcast von Holger", "found": false}, {"type": "without", "string": "Etwa alle zwei Wochen erscheint ", "found": false}]}
{"file": "regiolanda.de.filmbuero.html", "url": "https://www.regiolanda.de/content/149-filmbuero-goettingen", "text_len": 3652, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "G\u00f6ttingen war in den 1950er Jahren", "found": true}, {"type": "with", "string": "Bedeutend f\u00fcr den Standort waren neben Ateliergesellschaf", "found": true}, {"type": "with", "string": "die Schlie\u00dfung des Instituts f\u00fcr den Wissenschaftlichen Film", "found": true}, {"type": "without", "string": "An der Aue 1", "found": false}, {"type": "without", "string": " Warenkorb", "found": false}, {"type": "without", "string": "2018 Regiolanda ", "found": false}]}
{"file": "bund-naturschutz.de-habeck.html", "url": "https://www.bund-naturschutz.de/pressemitteilungen/habeck-besuch-in-muenchen-windkraft-in-bayern-kann-nur-ohne-10-h-in-fahrt-gebracht-werden", "text_len": 1912, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "dass das Gespr\u00e4ch zwischen", "found": false}, {"type": "with", "string": "Wir appellieren an die Ampelkoalition, dies", "found": true}, {"type": "with", "string": "Bek\u00e4mpfung der Klimakrise verlieren", "found": true}, {"type": "without", "string": "Downloads", "found": false}, {"type": "without", "string": "Energiewende: BN stellt f\u00fcnf Kernforderungen", "found": false}, {"type": "without", "string": "Foto: Christof Stache", "found": false}]}
{"file": "coaching-magazin.de.transgenerationales-coaching.html", "url": "https://www.coaching-magazin.de/konzepte/transgenerationales-coaching", "text_len": 14212, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wer bin ich wirklich?", "found": true}, {"type": "with", "string": "Der Einfluss der Vererbung", "found": true}, {"type": "with", "string": "Entwicklungsreise", "found": true}, {"type": "without", "string": "Themen:", "found": false}, {"type": "without", "string": "Dieser Artikel gef\u00e4llt Ihnen?", "found": false}, {"type": "without", "string": "Haben Sie Fragen zum Coaching-Magazin?", "found": false}]}
{"file": "mobilsicher.de.icloud.html", "url": "https://mobilsicher.de/aktuelles/apple-kippt-verschluesselungsplaene-fuer-icloud", "text_len": 3024, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Medienberichten zufolge hat", "found": false}, {"type": "with", "string": "Anders sieht es bei den Daten aus", "found": true}, {"type": "with", "string": "Was dabei erstaunlich wenig Beachtung", "found": true}, {"type": "without", "string": "Wie Apple welche Daten", "found": false}, {"type": "without", "string": "30.01.2020 Wieso Updates?", "found": false}, {"type": "without", "string": "Weitere Artikel", "found": false}]}
{"file": "maescot.de.schafskunde.html", "url": "http://www.maescot.de/kleine-schafskunde/", "text_len": 2976, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Schaf, Standardausf\u00fchrung, wei\u00df", "found": false}, {"type": "with", "string": "Bei diesem arroganten Schafweibchen", "found": true}, {"type": "with", "string": "Eine Intellektuelle, die", "found": true}, {"type": "without", "string": "Der Webcomic mit den niedlichen Schafen", "found": false}, {"type": "without", "string": "\u00a9 2009-2012 Jonathan Krase", "found": false}, {"type": "without", "string": "\u2026und anderem Web 2.0 Ged\u00f6ns.", "found": false}]}
{"file": "elpais.com.ciencia.html", "url": "https://elpais.com/elpais/2020/02/18/ciencia/1582045946_459487.html", "text_len": 9629, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Que en la Ant\u00e1rtida se registren", "found": true}, {"type": "with", "string": "Este mediod\u00eda la Base", "found": true}, {"type": "with", "string": "y pasar\u00e1 a ser verde", "found": true}, {"type": "without", "string": "Puede escribirnos", "found": true}, {"type": "without", "string": "Un grupo de ping\u00fcinos", "found": false}, {"type": "without", "string": "El portal de empleo InfoJobs", "found": false}]}
{"file": "steinhau.com.zahlen.html", "url": "http://www.steinhau.com/steinhau/wordpress/einmal-zahlen-alles-lesen/", "text_len": 24248, "tp": 4, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "Hinweis: Der nachfolgende Artikel mitsamt der telefonisch", "found": true}, {"type": "with", "string": "Der Ruf nach einer Flatrate", "found": true}, {"type": "with", "string": "sowohl in der Browser-Version als auch in der App", "found": true}, {"type": "with", "string": "Zugang zu einer Zielgruppe erm\u00f6glicht", "found": true}, {"type": "without", "string": "Schreibe einen Kommentar", "found": false}, {"type": "without", "string": "Deine E-Mail-Adresse wird nicht", "found": false}, {"type": "without", "string": "um Spam zu reduzieren", "found": false}, {"type": "without", "string": "Alle Rechte beim Autoren", "found": false}]}
{"file": "dvg.de.weihnachtsurlaub.html", "url": "https://www.dvfg.de/presse/pressemeldung/2022/11/29/verbrauchertipp-an-oder-aus-so-heizen-sie-waehrend-des-weihnachtsurlaubs-effizient", "text_len": 4348, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Weihnachten ist Reisezeit", "found": true}, {"type": "with", "string": "Thermostate runterdrehen,", "found": true}, {"type": "with", "string": " Smarten Thermostaten die Steuerung \u00fcberlassen", "found": false}, {"type": "without", "string": "zur\u00fcck zur Listenansicht", "found": false}, {"type": "without", "string": " 2022 Deutscher Verband Fl\u00fcssiggas e.V.", "found": false}, {"type": "without", "string": "Kontakt", "found": false}]}
{"file": "harrypotter.fandom.com.spell.html", "url": "https://harrypotter.fandom.com/wiki/Water-Making_Spell", "text_len": 7090, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\"The Water-Making Spell conjures clean, drinkable water from", "found": true}, {"type": "with", "string": "A jet of water flew out of the umbrella tip", "found": true}, {"type": "with", "string": "Hermione used this charm to extinguish his burning eyebrows", "found": true}, {"type": "without", "string": "Take your favorite fandoms with you and never miss a beat.", "found": false}, {"type": "without", "string": "What is your opinion on people becoming obsessed with Draco?", "found": false}, {"type": "without", "string": "Harry Potter Wiki is a FANDOM Movies Community.", "found": false}]}
{"file": "emotion.de.selfcare.html", "url": "https://www.emotion.de/psychologie-partnerschaft/persoenlichkeit/selfcare-fuer-faule-99-wege-dein-selbstbewusstsein-aufzupaeppeln", "text_len": 9094, "tp": 1, "fn": 2, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Jeden Morgen eine stundenlange Beauty-Routine", "found": false}, {"type": "with", "string": "\"Ich nehme mir regelm\u00e4\u00dfig Zeit und Ruhe", "found": false}, {"type": "with", "string": "Dir selbst Blumen", "found": true}, {"type": "without", "string": "Mehr Themen:", "found": true}, {"type": "without", "string": "BELIEBTE THEMEN ENTDECKEN", "found": false}, {"type": "without", "string": "\u00dcBER", "found": false}]}
{"file": "theintercept.com-Gaza.html", "url": "https://theintercept.com/2023/11/08/gaza-hospitals-babies-doctors-patients/", "text_len": 13042, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "The shortages led to what in the West", "found": true}, {"type": "with", "string": "would be unthinkable decisions", "found": true}, {"type": "with", "string": "choosing between patients who", "found": true}, {"type": "without", "string": "U.S. Weapons Transfers to Israel Shrouded in Secrecy \u2014 but Not Ukraine", "found": false}, {"type": "without", "string": "Inside the Biden White House, Doubts About Gaza War Are Beginning to Creep In", "found": false}, {"type": "without", "string": "GOP Representative Denies Existence", "found": false}]}
{"file": "oetker.de.bienenstich.html", "url": "https://www.oetker.de/rezepte/r/bienenstich-muffins", "text_len": 2539, "tp": 4, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Saftig-weiche Muffins aus Hefeteig", "found": false}, {"type": "with", "string": "f\u00fcr das Rezept Bienenstich-Muffins", "found": true}, {"type": "with", "string": "Dr. Oetker Vanillin-Zucker", "found": true}, {"type": "with", "string": "Belag:", "found": false}, {"type": "with", "string": "Hei\u00dfluft etwa 180 \u00b0C", "found": true}, {"type": "with", "string": "ein gro\u00dfes Brett legen.", "found": true}, {"type": "without", "string": "Merken", "found": false}, {"type": "without", "string": "Verwendete Dr. Oetker Produkte", "found": false}, {"type": "without", "string": "(24 Rezepte)", "found": false}]}
{"file": "nmb-media.de.ebay.html", "url": "https://shop.nmb-media.de/eBay-Template-Datenschutz-Google-Fonts-Fontawesome", "text_len": 1900, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Aus datenschutzrechtlichen Gr\u00fcnden wird", "found": true}, {"type": "with", "string": "Aufgrund der derzeitigen, datenschutzrechtlichen", "found": true}, {"type": "with", "string": "Die IP-Adressen werden", "found": true}, {"type": "without", "string": "Die Beratung zu den von uns angebotenen", "found": false}, {"type": "without", "string": "Fernwartung nach Absprache per AnyDesk", "found": false}, {"type": "without", "string": "Bitte laden Sie sich \u00fcber Ihr ", "found": true}]}
{"file": "elle.de.sneaker.html", "url": "https://www.elle.de/plateau-sneaker-trend", "text_len": 1458, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "am meisten getragenen Lieblingsteilen in deiner Garderobe", "found": true}, {"type": "with", "string": "Die L\u00f6sung f\u00fcr diese modische Herausforderung liegt in der", "found": true}, {"type": "with", "string": "So geht die Tendenz nach Dad Sneaker und Ugly Sneaker", "found": true}, {"type": "without", "string": "Net Sustain: Die neue Plattform von", "found": false}, {"type": "without", "string": "Zum Shop", "found": false}, {"type": "without", "string": "Affiliatelink", "found": false}]}
{"file": "statisticsglobe.com.ggplot2.html", "url": "https://statisticsglobe.com/change-font-size-of-ggplot2-plot-in-r-axis-text-main-title-legend", "text_len": 6852, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "explain how to increase and decrease the text", "found": true}, {"type": "with", "string": "y = Probability", "found": true}, {"type": "with", "string": "If you have any further questions, please", "found": true}, {"type": "without", "string": "Get regular updates on the latest tutorials", "found": false}, {"type": "without", "string": "On this website, I provide statistics tutorials", "found": false}, {"type": "without", "string": "Related Tutorials", "found": false}]}
{"file": "thw.de-frauen.html", "url": "https://www.thw.de/SharedDocs/Meldungen/DE/Meldungen/national/2021/10/meldung_01_miniserie_frauen_im_thw/meldung_001_startseite_miniserie_frauen_im_thw.html", "text_len": 2699, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "heute f\u00fcr Frauen ist und wie", "found": true}, {"type": "with", "string": "nahezu allen Gesellschaften und Kulturen", "found": true}, {"type": "with", "string": "\u201eCool, \u2018ne Frau in", "found": true}, {"type": "without", "string": "Mehr zum Ereignis", "found": false}, {"type": "without", "string": "Das THW in Ihrer", "found": false}, {"type": "without", "string": "Alle Termine", "found": false}]}
{"file": "awo.org-Menschenrechte.html", "url": "https://www.awo.org/menschenrechte-achten", "text_len": 2271, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Gesundheitsversorgung gew\u00e4hren und", "found": true}, {"type": "with", "string": "Gefl\u00fcchtete brauchen einen", "found": true}, {"type": "with", "string": "Dies gelingt durch einen", "found": true}, {"type": "without", "string": "Aktionstag Suchtberatung.", "found": false}, {"type": "without", "string": "Suchtberatung wirkt", "found": false}, {"type": "without", "string": "Klassismus in", "found": false}]}
{"file": "incurvy.de.wellness.html", "url": "https://www.incurvy.de/trends-grosse-groessen/wellness-gesichtsbehandlung-plaisir-daromes/", "text_len": 8747, "tp": 4, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Zeit f\u00fcr Loslassen und Entspannung.", "found": true}, {"type": "with", "string": "Erfrischende, abschwellende Augencreme Phyto Contour", "found": true}, {"type": "with", "string": "Wie sieht dein Alltag aus?", "found": true}, {"type": "with", "string": "Vielen Dank Anja f\u00fcr deine Tipps rund um Beauty", "found": true}, {"type": "without", "string": "Das Thema k\u00f6nnte dich auch interessieren:", "found": true}, {"type": "without", "string": "Betreiberin von incurvy Plus Size", "found": false}, {"type": "without", "string": "Wir verwenden Cookies", "found": false}]}
{"file": "happyface313.com.plantur.html", "url": "https://happyface313.com/2018/03/07/im-test-plantur-39-color-braun-phyto-coffein-shampoo-und-pflege-spulung/", "text_len": 5700, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Als ich neulich eine Anfrage erhielt", "found": true}, {"type": "with", "string": "Shampoo und Sp\u00fclung werden in einer dunkelbrauen", "found": true}, {"type": "with", "string": "und meine Haare sahen gesund", "found": true}, {"type": "without", "string": "Teilen mit:", "found": false}, {"type": "without", "string": "Follow Blog via Email", "found": false}, {"type": "without", "string": "Vollst\u00e4ndiges Profil anzeigen", "found": false}]}
{"file": "pronats.de.arbeit.html", "url": "https://www.pronats.de/informationen/kindheit-und-arbeit/kinder-und-arbeit/", "text_len": 10618, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Nicht die Arbeit ist f\u00fcr die", "found": true}, {"type": "with", "string": "Wir bestehen deshalb darauf", "found": true}, {"type": "with", "string": "Einmal begleiteten wir eine", "found": true}, {"type": "without", "string": "Als NATs bezeichnen sich die", "found": false}, {"type": "without", "string": "Texte auf dieser Webseite stehen unter einer", "found": false}, {"type": "without", "string": "ProNATs - Verein zur Unterst\u00fctzung arbeitender", "found": false}]}
{"file": "she-works.de.sport.html", "url": "https://www.she-works.de/aktuelles/5-inspirierende-frauen-aus-der-sportwelt/2022/12/29/ ", "text_len": 4691, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die amerikanische Profi-Surferin", "found": true}, {"type": "with", "string": "Wenn wir schon beim Snowboarden", "found": true}, {"type": "with", "string": "Diese Legende und Powerfrau darf wohl", "found": true}, {"type": "without", "string": "Schlagw\u00f6rter", "found": false}, {"type": "without", "string": "E-Magazin", "found": false}, {"type": "without", "string": "SHE!", "found": false}]}
{"file": "grossefragen.wordpress.com.projekt.html", "url": "https://grossefragen.wordpress.com/2019/03/13/wuerde-des-lebens-ein-projekt/", "text_len": 5642, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Dieses Thema eignet", "found": true}, {"type": "with", "string": "Dabei gelten ein paar wichtige", "found": true}, {"type": "with", "string": "=> Wie hast Du gelernt?", "found": true}, {"type": "without", "string": "Unterrichtsideen und die Bilder", "found": false}, {"type": "without", "string": "f\u00fcr erfolgreiches Lernen", "found": false}, {"type": "without", "string": "142 Antworten zu", "found": false}]}
{"file": "0b66696af800472190a76b26faa845d4.html", "url": "https://jungefreiheit.de/debatte/kommentar/2019/kaisers-royaler-wochenrueckblick-31/", "text_len": 4299, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Im Interview mit dem Sportportal", "found": true}, {"type": "with", "string": "Ist \u00d6zil ein verkappter Feingeist?", "found": true}, {"type": "with", "string": "nicht f\u00fcr einen Rosenkranz h\u00e4lt.", "found": true}, {"type": "without", "string": "Der n\u00e4chste Beitrag", "found": false}, {"type": "without", "string": "Die Kommentarfunktion wird 2 Tage nach Ver\u00f6ffentlichungsdatum des Beitrages geschlossen.", "found": false}, {"type": "without", "string": "Meistkommentiert", "found": false}]}
{"file": "womencantalksports.com-top10.html", "url": "http://www.womencantalksports.com/top-10-women-talking-sports/", "text_len": 2935, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "begin a series highlighting", "found": true}, {"type": "with", "string": "5. Kristi Dosh", "found": true}, {"type": "with", "string": "I really love what", "found": true}, {"type": "without", "string": "Submit your sports", "found": false}, {"type": "without", "string": "Twitter Talk", "found": false}, {"type": "without", "string": "So Much Math in Football?", "found": false}]}
{"file": "spektrum.de.engelbart.html", "url": "https://scilogs.spektrum.de/engelbart-galaxis/die-ablehnung-der-gendersprache/", "text_len": 10461, "tp": 2, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Zweitens wird der Genderstern", "found": true}, {"type": "with", "string": "alldem leider \u2013 nichts.", "found": true}, {"type": "without", "string": "Originalbeitrag", "found": false}, {"type": "without", "string": "Spektrum.de Newsletter", "found": false}, {"type": "without", "string": "Beitragsbild", "found": true}]}
{"file": "infobae.com-ucrania.html", "url": "https://www.infobae.com/america/mundo/2022/05/03/el-nobel-de-la-paz-ruso-dmitry-muratov-advirtio-que-el-regimen-de-vladimir-putin-podria-utilizar-armas-nucleares-en-ucrania/", "text_len": 4079, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "El periodista sostuvo que eso supondr\u00eda \u201cel fin", "found": false}, {"type": "with", "string": "advirtiendo que eso supondr\u00eda\u201c", "found": false}, {"type": "with", "string": "un poder absoluto y sin restricciones\u201d.", "found": true}, {"type": "without", "string": "TEMAS RELACIONADOS", "found": false}, {"type": "without", "string": "Muratov, tras el ataque sufrido a principios", "found": false}, {"type": "without", "string": "Premio Nobel de la Paz (REUTERS/Denis Balibouse)", "found": false}]}
{"file": "deutsche-wirtschafts-nachrichten.de-Industriestrompreis.html", "url": "https://deutsche-wirtschafts-nachrichten.de/706332/industriestrompreis-kein-ende-der-debatte?src=live", "text_len": 1966, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Bundeswirtschaftsminister Robert Habeck", "found": true}, {"type": "with", "string": " die Industrie und die Gewerkschaft IG Metall", "found": false}, {"type": "with", "string": "dringen auf ein schnelles Ja f\u00fcr einen verbilligten Strompreis", "found": false}, {"type": "without", "string": "Experte: Energiepreise werden weiter steigen", "found": false}, {"type": "without", "string": "Standort Deutschland \u2013 zu gro\u00dfes Gesch\u00e4ftsrisiko?", "found": false}, {"type": "without", "string": "Unverbindliches aus dem Hause Habeck", "found": false}]}
{"file": "novalanalove.com.ear-candy.html", "url": "https://novalanalove.com/ear-candy/", "text_len": 1179, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Earcuff: Zoeca", "found": true}, {"type": "with", "string": "mit l\u00e4ngeren Ohrringen (:", "found": true}, {"type": "with", "string": "Kreole: Stella Hoops", "found": true}, {"type": "without", "string": "Jetzt hei\u00dft es schnell sein:", "found": false}, {"type": "without", "string": "Diese Website speichert Cookies", "found": false}, {"type": "without", "string": "VON Sina Giebel", "found": false}]}
{"file": "piratenpartei-marburg.de.fridays.html", "url": "https://www.piratenpartei-marburg.de/2019/09/21/wir-unterstuetzen-fridays-for-future/", "text_len": 702, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Ignoranz, mit der die Dringlichkeit tiefgreifender \u00c4nderungen", "found": true}, {"type": "with", "string": "Diese Seite war gestern nicht erreichbar", "found": true}, {"type": "with", "string": "Die Ignoranz, mit der die Dringlichkeit", "found": true}, {"type": "without", "string": "Klarmachen zum \u00c4ndern!", "found": false}, {"type": "without", "string": "Von allein wird es nicht besser!", "found": false}, {"type": "without", "string": "Copyright \u00a9 2020 Piratenpartei", "found": false}]}
{"file": "archive.org.the-pain.net.silkroad.html", "url": "https://web.archive.org/web/20130307194448/the-pain.net/2008/05/silkroad-roc-mountain-quests-und-npcs.html", "text_len": 7147, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ich wurde von vielen Leuten darum gebeten zum neuen", "found": true}, {"type": "with", "string": "man kann ja nicht alles wissen", "found": true}, {"type": "with", "string": "Bringe eine Nachricht \u00fcber den vermissten Sohn zu", "found": true}, {"type": "without", "string": "Silkroad Online und alle damit in Verbindung stehenden Logos", "found": false}, {"type": "without", "string": "2007 - 2013", "found": false}, {"type": "without", "string": "Alle anderen Warenzeichen oder", "found": false}]}
{"file": "pawszilla.com.celine.html", "url": "https://pawszilla.com/pop-culture/celebrities/fans-expressed-fears-celine-dions-appearance-savagely-responded/21/", "text_len": 28437, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Even though C\u00e9line Dion is a multi-million-selling", "found": true}, {"type": "with", "string": "So this led to the star coming clean to her critics in spectacular fashion.", "found": true}, {"type": "with", "string": "Her most iconic looks of the 1990s", "found": true}, {"type": "without", "string": "Getty Images", "found": false}, {"type": "without", "string": "Staff Writer", "found": false}, {"type": "without", "string": "Battery Media Group", "found": false}]}
{"file": "lsvd.de-afghanistan.html", "url": "https://www.lsvd.de/de/ct/6520-Erste-Zusagen-fuer-Aufnahmen-von-ueber-80-LSBTI-aus-Afghanistan", "text_len": 4840, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wir begr\u00fc\u00dfen die mehr als 80 Aufnahmezusagen", "found": true}, {"type": "with", "string": "vom Ausw\u00e4rtigen Amt bei der Familienzusammenf\u00fchrung", "found": true}, {"type": "with", "string": "Situation verschiedener Personengruppen", "found": true}, {"type": "without", "string": "Pressesprecher*in Markus Ulrich", "found": false}, {"type": "without", "string": "zust\u00e4ndiges Vorstandsmitglied", "found": false}, {"type": "without", "string": "Der Lesben- und Schwulenverband (LSVD) ist", "found": false}]}
{"file": "lacuarta.com-loretoaravena.html", "url": "https://www.lacuarta.com/espectaculos/noticia/va-y-agarra-las-llaves-de-su-cartera-destapan-pelea-a-grito-pelado-entre-loreto-aravena-y-pancha-merino-en-pasillos-de-canal-13/I7QCHL6HAZCBBIROIOUNHFGB5I/", "text_len": 2474, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "protagoniz\u00f3 Loreto Aravena y Pancha", "found": true}, {"type": "with", "string": "hasta el camar\u00edn del Bienvenidos.", "found": true}, {"type": "with", "string": "alegando que le ocupan el estacionamiento\u201d", "found": true}, {"type": "without", "string": "COMPARTIR NOTA", "found": false}, {"type": "without", "string": "TEMAS RELACIONADOS", "found": false}, {"type": "without", "string": "Stella a Francisca en Pobre Novio", "found": false}]}
{"file": "missy-magazine.de-interabled.html", "url": "https://missy-magazine.de/blog/2023/10/30/interabled-sex-education/", "text_len": 9217, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Sex ist immer schon etwas anderes als es selbst.", "found": true}, {"type": "with", "string": "M\u00fcssen wir verstehen, was wir begehren?", "found": true}, {"type": "with", "string": "Wo f\u00e4ngt die Lust an und wer entscheidet", "found": true}, {"type": "without", "string": "Vertr\u00e4ge k\u00fcndigen", "found": false}, {"type": "without", "string": "weitere Artikel", "found": false}, {"type": "without", "string": "K\u00f6rper&Sex", "found": false}]}
{"file": "ejwue.de.lieferketten.html", "url": "https://www.ejwue.de/aktuell/news/faire-lieferketten/", "text_len": 3002, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Deshalb l\u00e4dt der EJW-Weltdienst zusammen", "found": true}, {"type": "with", "string": "Das Evangelische Jugendwerk in W\u00fcrttemberg", "found": true}, {"type": "with", "string": "koordiniert, f\u00f6rdert und gestaltet", "found": true}, {"type": "without", "string": "Haeberlinstra\u00dfe 1-3", "found": false}, {"type": "without", "string": "Kontaktieren Sie uns gerne auch direkt", "found": false}, {"type": "without", "string": "kalte Welt herein leuchten", "found": false}]}
{"file": "tagesspiegel.de.abstandsregeln.html", "url": "https://www.tagesspiegel.de/wirtschaft/abstandsregeln-und-fieberkontrollen-wie-firmen-ihre-beschaeftigten-vor-dem-coronavirus-schuetzen/25784520.html", "text_len": 7253, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Ideen reichen vom Spuckschutz bis zur Kontrolle d", "found": false}, {"type": "with", "string": "Heil mahnte: Besorgt ausreichend Seife und Desinfektionsmittel!", "found": true}, {"type": "with", "string": "Das Liefergesch\u00e4ft mit Hotels, das die H\u00e4lfte des Umsatzes ausmachte, ist weggebrochen", "found": true}, {"type": "without", "string": "Diskutieren Sie mit!", "found": false}, {"type": "without", "string": "Meistdiskutiert", "found": false}, {"type": "without", "string": "Login", "found": false}]}
{"file": "archive.org.he.xinhuanet.com.25340717.html", "url": "https://web.archive.org/web/20120611024252/http://www.he.xinhuanet.com/news/2012-06/04/content_25340717.htm", "text_len": 2967, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u4e00\u4e2a\u7ea6\u5b9a\uff0c\u4fe1\u5b8815\u5e74\uff0c\u611f\u4eba\u81f3\u6df1\uff1b\u4e00\u6bb5\u771f\u60c5\uff0c\u5ef6\u7eed15\u5e74", "found": false}, {"type": "with", "string": "\u79e6\u7687\u5c9b\u3001\u627f\u5fb7\u3001\u5f20\u5bb6\u53e3\u7b4910\u4e2a\u8bbe\u533a\u5e02\u6f14\u51fa(\u6b64\u524d\u5df2\u5728\u4fdd\u5b9a\u5e02\u6f14\u51fa\u591a\u573a)\uff0c\u5f15\u8d77\u5f3a\u70c8\u53cd\u54cd\u3002", "found": false}, {"type": "with", "string": "\u5982\u4eca\uff0c\u5411\u6cb3\u5317\u519c\u5927\u679c\u681193(01)\u73ed\u6bd5\u4e1a\u751f\u7fa4\u4f53\u5b66\u4e60\u7684\u70ed\u6f6e\u6b63\u5728\u5168\u7701\u5404\u5730\u6df1\u5165\u5f00\u5c55\u3002\u5eca\u574a\u4ee5\u5de1\u6f14\u4e3a", "found": false}, {"type": "without", "string": "copyright (c) 2000", "found": false}, {"type": "without", "string": "ICP\u8bc1010042\u53f7", "found": false}, {"type": "without", "string": "\u6cb3\u5317\u63a2\u7d22\u519c\u6751\u52b3\u52a8\u529b\u5c31\u5730\u5c31\u8fd1\u8f6c\u79fb\u57f9\u8bad", "found": false}]}
{"file": "scienceblogs.de-zufaellig.html", "url": "https://scienceblogs.de/mathlog/2023/11/06/muenzwuerfe-sind-nicht-zufaellig/", "text_len": 1668, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Alles ist im Prinzip berechenbar", "found": true}, {"type": "with", "string": "Zufall entsteht nur durch unvollst\u00e4ndige Information", "found": true}, {"type": "with", "string": "Der Wurf einer M\u00fcnze ist nicht zuf\u00e4llig", "found": true}, {"type": "without", "string": "Neueste Beitr\u00e4ge", "found": false}, {"type": "without", "string": "Top Posts from WordPress stats", "found": false}, {"type": "without", "string": "ScienceBlogs ist ein gesch\u00fctztes Markenzeichen.", "found": false}]}
{"file": "latimes.com.bloomberg.html", "url": "https://www.latimes.com/politics/story/2020-02-19/mike-bloomberg-democratic-debate-history", "text_len": 7393, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "a lot of explaining.", "found": true}, {"type": "with", "string": "His opponents don\u2019t lack for material to use.", "found": true}, {"type": "with", "string": "floating above the fray", "found": true}, {"type": "without", "string": "The latest news, analysis and insights", "found": false}, {"type": "without", "string": "writes about a broad range", "found": false}, {"type": "without", "string": "California loosens its individual mandate", "found": false}]}
{"file": "mesopinions.com.mutilation.html", "url": "https://www.mesopinions.com/petition/art-culture/mutilation-choeur-radio-france-unique-choeur/76519", "text_len": 3019, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "National de France et du Philharmonique de Radio France.", "found": true}, {"type": "with", "string": "bien des promesses non tenues par des directions successives", "found": true}, {"type": "with", "string": "vide de toute ambition artistique et culturelle.", "found": true}, {"type": "without", "string": "Notre communaut\u00e9", "found": false}, {"type": "without", "string": "Espace presse", "found": false}, {"type": "without", "string": "R\u00e9ussir votre mobilisation", "found": false}]}
{"file": "football.ua.podolski.html", "url": "https://football.ua/germany/311510-podolski-zavershil-kareru-v-sbornojj.html", "text_len": 1222, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u043b\u0435\u0442\u043d\u0438\u0439 \u041b\u0443\u043a\u0430\u0448 \u041f\u043e\u0434\u043e\u043b\u044c\u0441\u043a\u0438 \u2013 \u0442\u0440\u0435\u0442\u0438\u0439 \u043f\u043e \u043a\u043e\u043b\u0438\u0447\u0435\u0441\u0442\u0432\u0443 \u043c\u0430\u0442\u0447\u0435\u0439 \u0437\u0430 \u0441\u0431\u043e\u0440\u043d\u0443\u044e", "found": true}, {"type": "with", "string": "\u042d\u043a\u0441-\u0438\u0433\u0440\u043e\u043a \u0410\u0440\u0441\u0435\u043d\u0430\u043b\u0430 \u0438 \u0411\u0430\u0432\u0430\u0440\u0438\u0438 \u043f\u043e\u043f\u0430\u043b \u0432 \u0437\u0430\u044f\u0432\u043a\u0443", "found": true}, {"type": "with", "string": "\u0420\u0435\u0448\u0435\u043d\u0438\u0435 \u0434\u0430\u043b\u043e\u0441\u044c \u043c\u043d\u0435 \u043e\u0447\u0435\u043d\u044c \u0442\u044f\u0436\u0435\u043b\u043e. \u0421\u0431\u043e\u0440\u043d\u0430\u044f \u0432\u0441\u0435\u0433\u0434\u0430 \u0431\u044b\u043b\u0430", "found": true}, {"type": "without", "string": "\u00a9 2006-2019 \u041e\u041e\u041e \"\u0412\u0418\u0414\u0410\u0412\u041d\u0418\u0426\u0422\u0412\u041e \u0423\u041a\u0420\u0410\u0407\u041d\u0421\u042c\u041a\u0418\u0419 \u041c\u0415\u0414\u0406\u0410 \u0414\u0406\u041c\". \u0412\u0441\u0435 \u043f\u0440\u0430\u0432\u0430 \u0437\u0430\u0449\u0438\u0449\u0435\u043d\u044b.", "found": false}, {"type": "without", "string": "\u041f\u043e\u043b\u0438\u0442\u0438\u043a\u0430 \u0432 \u0441\u0444\u0435\u0440\u0435 \u043a\u043e\u043d\u0444\u0438\u0434\u0435\u043d\u0446\u0438\u0430\u043b\u044c\u043d\u043e\u0441\u0442\u0438 \u0438 \u043f\u0435\u0440\u0441\u043e\u043d\u0430\u043b\u044c\u043d\u044b\u0445 \u0434\u0430\u043d\u043d\u044b\u0445", "found": false}, {"type": "without", "string": "\u0413\u0435\u0440\u043c\u0430\u043d\u0438\u044f. \u041d\u043e\u0432\u043e\u0441\u0442\u0438", "found": false}]}
{"file": "24horas.cl-segundo.html", "url": "https://www.24horas.cl/politica/presidente-boric-inicia-gira-por-magallanes-este-miercoles-5287894", "text_len": 3185, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "joven jefe del Estado, al que apenas se", "found": true}, {"type": "with", "string": "mundial, arrastrada por la guerra en Europa", "found": true}, {"type": "with", "string": "Armada por el \"Mes del Mar\", retomar el pulso", "found": true}, {"type": "without", "string": "condonaci\u00f3n progresiva del CAE", "found": false}, {"type": "without", "string": "Kiss se present\u00f3 por", "found": false}, {"type": "without", "string": "M\u00c1S SE\u00d1ALES EN VIVO", "found": false}]}
{"file": "franziska-elea.de.vuitton.html", "url": "http://www.franziska-elea.de/2019/02/10/das-louis-vuitton-missgeschick/", "text_len": 4271, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Zuerst dachte ich, ich k\u00f6nnte das", "found": true}, {"type": "with", "string": "x Franzi", "found": true}, {"type": "with", "string": "Flauschjacke: Bershka", "found": true}, {"type": "without", "string": "Palm Springs Mini (links)", "found": false}, {"type": "without", "string": "Diese Website verwendet Akismet", "found": false}, {"type": "without", "string": "New York, New York", "found": false}]}
{"file": "heise.de.lithium.html", "url": "https://www.heise.de/newsticker/meldung/Lithium-aus-dem-Schredder-4451133.html", "text_len": 2220, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die \u00d6kobilanz von Elektroautos", "found": true}, {"type": "with", "string": "Nur die Folie bleibt zur\u00fcck", "found": true}, {"type": "without", "string": "TR 7/2019", "found": false}, {"type": "without", "string": "Forum zum Thema:", "found": false}, {"type": "without", "string": "Highlights aus dem Heft:", "found": false}]}
{"file": "silvias.net.wahlzensur.html", "url": "http://www.silvias.net/blog/wahlzensur-angriff-auf-universitaeten/", "text_len": 3135, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Am 25. Oktober gab es", "found": true}, {"type": "with", "string": "Der Oberste Wahlgerichtshof", "found": true}, {"type": "with", "string": "At\u00e9 agora tiveram", "found": true}, {"type": "without", "string": "alle inhalte @silviajura", "found": false}, {"type": "without", "string": "CAPTCHA Code", "found": false}, {"type": "without", "string": "Primavera feminista em Viena", "found": false}]}
{"file": "1hundetagebuch.wordpress.com.langer.html", "url": "https://1hundetagebuch.wordpress.com/2019/10/31/nach-viel-zu-langer-zeit-mal-wieder/", "text_len": 2564, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ich k\u00f6nnte glatt ein schlechtes Gewissen", "found": true}, {"type": "with", "string": "So muss Mesty jetzt Pillen nehmen", "found": true}, {"type": "with", "string": "Vielleicht muss man die Dosis des", "found": true}, {"type": "without", "string": "Share this:", "found": false}, {"type": "without", "string": "Kommentar verfassen", "found": false}, {"type": "without", "string": "Ein Blog \u00fcber die Abenteue", "found": false}]}
{"file": "siegfried-marcus-berufsschule.at.kft.html", "url": "https://www.siegfried-marcus-berufsschule.at/kraftfahrzeugtechnik/lehrberufe-kft-2/", "text_len": 100980, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Lehrstoffinhalte", "found": true}, {"type": "with", "string": "3. Klasse", "found": true}, {"type": "with", "string": "Module", "found": true}, {"type": "without", "string": "Direktor: OSR Dipl.-P\u00e4d. Markus Fuchs", "found": false}, {"type": "without", "string": "Verein der Freunde f\u00fcr berufsbegleitende Aus- und ", "found": false}, {"type": "without", "string": "Obmann: OSR Markus Fuchs", "found": false}]}
{"file": "Winda w chmurach _ Obyczaje _ Dwutygodnik _ Dwutygodnik.html", "url": "https://www.dwutygodnik.com/artykul/9491-winda-w-chmurach.html", "text_len": 9461, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ludzie ci", "found": true}, {"type": "with", "string": "Aleksandra Zbroja przedstawia si\u0119", "found": false}, {"type": "with", "string": "Mireczka, i bez niego.", "found": true}, {"type": "without", "string": "11 minut czytania", "found": false}, {"type": "without", "string": "Historyczka nowoczesnej kultury polskiej", "found": false}, {"type": "without", "string": "IWONA KURZ", "found": false}]}
{"file": "fdpbt.de-epidemischenLage.html", "url": "https://www.fdpbt.de/beendigung-epidemischen-lage-nationaler-tragweite", "text_len": 2623, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Lage von nationaler Tragweite", "found": true}, {"type": "with", "string": "erste Fraktion gewesen", "found": true}, {"type": "with", "string": "Das Konzeptpapier", "found": true}, {"type": "without", "string": "Mit unserem Newsletter", "found": false}, {"type": "without", "string": "Artikel", "found": false}, {"type": "without", "string": "Twitter", "found": false}]}
{"file": "freshideen.com-Stollenfest.html", "url": "https://freshideen.com/rezepte/dresdner-stollenfest.html", "text_len": 5233, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wir eher nicht!", "found": true}, {"type": "with", "string": "Denn der ber\u00fchmte Kuchen mit Rosinen", "found": true}, {"type": "with", "string": "Marzipan oder Schokolade geh\u00f6rt einfach zum Fest", "found": true}, {"type": "without", "string": "Verwandte Artikel", "found": false}, {"type": "without", "string": "Kalorienarmes Tiramisu mit viel Protein f\u00fcr sportich aktive Personen", "found": false}, {"type": "without", "string": "Schnelles Abendessen \u2013 2 Blitzrezepte f\u00fcr einen angenehmen Feierabend", "found": false}]}
{"file": "speicherguide.de.schwierige.html", "url": "https://www.speicherguide.de/digitalisierung/faktor-mensch/schwierige-gespraeche-so-gehts-24376.aspx", "text_len": 317, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Konflikte mag keiner.", "found": true}, {"type": "with", "string": "Gespr\u00e4che meistern k\u00f6nnen.", "found": true}, {"type": "without", "string": "Weiterf\u00fchrender Link", "found": false}, {"type": "without", "string": "Flexible Wege in die", "found": false}]}
{"file": "befifty.montauk.html", "url": "https://www.befifty.de/home/2017/7/12/unter-uns-montauk", "text_len": 5241, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Im kurzen BeFifty Video", "found": true}, {"type": "with", "string": "Und hier einige Impressionen", "found": true}, {"type": "with", "string": "bodenst\u00e4ndig und stilsicher", "found": true}, {"type": "without", "string": "Um Ihnen ein besseres Nutzererlebnis", "found": false}, {"type": "without", "string": "auf Linie gebracht", "found": false}, {"type": "without", "string": "Tumblr", "found": false}]}
{"file": "urania.de.freiheit.html", "url": "https://www.urania.de/die-freiheit-der-planung", "text_len": 7364, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Was haben fahrerlose Autos und Pakete ", "found": true}, {"type": "with", "string": "\u00d6ffentliche R\u00e4ume sind", "found": true}, {"type": "with", "string": "St\u00e4dtebau ist planungsrechtlich die Art", "found": true}, {"type": "without", "string": "Diese Seite teilen", "found": false}, {"type": "without", "string": "Blog", "found": false}, {"type": "without", "string": "Cookie-Einstellungen", "found": false}]}
{"file": "OnlineMarketing.de-Instagram.html", "url": "https://onlinemarketing.de/social-media-marketing/instagram-neue-videofunktion-stories", "text_len": 95, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Nutzer:innen haben die M\u00f6glichkeit", "found": false}, {"type": "with", "string": "ein bis zu 15 Sekunden langes Video mit ihrem Smartphone aufzunehmen", "found": false}, {"type": "with", "string": "und danach \u00fcber Instagram in ihren Stories hochzuladen.", "found": false}, {"type": "without", "string": "Dein personalisierter Newsletter", "found": false}, {"type": "without", "string": "Whitepaper kostenlos downloaden", "found": false}, {"type": "without", "string": "Webinare zu digitalen Themen", "found": false}]}
{"file": "juraforum.de-Wohngeld.html", "url": "https://www.juraforum.de/recht-gesetz/ohne-ernsthafte-bewerbungsbemuehungen-kein-wohngeld-722430", "text_len": 2075, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Verwaltungsgericht hielt die ablehnenden Wohngeldentscheidung", "found": true}, {"type": "with", "string": "Standort abgelehnt, ohne jedoch", "found": true}, {"type": "with", "string": "Er habe aber keinerlei ernsthaften", "found": true}, {"type": "without", "string": "KOMMENTAR SCHREIBEN", "found": false}, {"type": "without", "string": "Lexware f\u00fcr Unternehmer", "found": false}, {"type": "without", "string": "BISHERIGE KOMMENTARE ZUR", "found": false}]}
{"file": "piratenpartei-mv.de.grundeinkommen.html", "url": "https://piratenpartei-mv.de/blog/2013/09/12/grundeinkommen-ist-ein-menschenrecht/", "text_len": 1327, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Unter diesem Motto findet am 14. September", "found": true}, {"type": "with", "string": "Volksinitiative Schweiz zum Grundeinkommen.", "found": true}, {"type": "without", "string": "getaggt mit:", "found": false}, {"type": "without", "string": "Was denkst du?", "found": false}]}
{"file": "link.springer.com.1007.html", "url": "https://link.springer.com/article/10.1007/s11926-017-0626-z", "text_len": 16242, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "The purpose of the review is to summarise", "found": true}, {"type": "with", "string": "The most commonly reported drugs are allopurinol", "found": true}, {"type": "with", "string": "Kirchhof MG, Wong A, Dutz JP. Cyclosporine treatment", "found": true}, {"type": "without", "string": "Immediate online access to all issues from 2019.", "found": false}, {"type": "without", "string": "\u00a9 2020 Springer Nature Switzerland AG", "found": false}, {"type": "without", "string": "Instant access to the full article PDF.", "found": false}]}
{"file": "wirtschaftspsychologie-aktuell.de.starken.html", "url": "https://wirtschaftspsychologie-aktuell.de/magazin/fuehrung/staerkenorientierte-fuehrung ", "text_len": 6754, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "St\u00e4rkenorientierte F\u00fchrung", "found": true}, {"type": "with", "string": "Rund zwei Millionen Stellen", "found": true}, {"type": "with", "string": "Positive Leadership l\u00e4sst sich s", "found": true}, {"type": "without", "string": "Zum Weiterlesen:", "found": true}, {"type": "without", "string": "Shared, Plural oder Dual Leadership:", "found": false}, {"type": "without", "string": "2022 Deutscher Psychologen Verlag GmbH", "found": false}]}
{"file": "pcmag.com.platters.html", "url": "https://www.pcmag.com/news/next-gen-hamr-platters-promise-80tb-hard-drives", "text_len": 2272, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "but the path looks clear to scale up to 80TB.", "found": false}, {"type": "with", "string": "hat means an 80TB hard drive is theoretically possible.", "found": true}, {"type": "with", "string": "per square inch. Based on to", "found": true}, {"type": "without", "string": "nd a Masters in Computer Games Development from Abertay University.", "found": false}, {"type": "without", "string": "Read the latest from Matthew Humphries", "found": false}, {"type": "without", "string": "Honest, Objective Reviews", "found": false}]}
{"file": "autosprint.ch-pistenstopp.html", "url": "https://www.autosprint.ch/de/classic/histo-monte-pistenstopp-in-rheinfelden/", "text_len": 2179, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Histo-Monte stehen gut. Die", "found": true}, {"type": "with", "string": "gesperrte historische Stadtbr\u00fccke benutzten", "found": true}, {"type": "with", "string": "fr\u00fcherer Veranstaltungen zur Verf\u00fcgung", "found": true}, {"type": "without", "string": "Beitr\u00e4ge zum Thema", "found": false}, {"type": "without", "string": "Respekt vor dem", "found": false}, {"type": "without", "string": "Erinnerung an den", "found": false}]}
{"file": "elespectador.com-orion.html", "url": "https://www.elespectador.com/judicial/asi-seran-los-tres-macrocasos-que-abrira-la-jep/", "text_len": 6839, "tp": 2, "fn": 1, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "contra la naturaleza ser\u00e1n parte de las investigaciones", "found": false}, {"type": "with", "string": "El 09, en las violencias que sufrieron los pueblos \u00e9tnicos", "found": true}, {"type": "with", "string": "macrocaso, pero se apart\u00f3 de exigencias m\u00e1s duras", "found": true}, {"type": "without", "string": "Desvinculan al general (r) Leonardo Barrero", "found": false}, {"type": "without", "string": "Le puede interesar", "found": true}, {"type": "without", "string": "Mejor calidad de vida con gas natural", "found": false}]}
{"file": "gizmeo.eu.insekten.html", "url": "https://gizmeo.eu/makrophotos-von-insekten/", "text_len": 780, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Alle seine Photos entstanden", "found": true}, {"type": "with", "string": "Eine Ameise in einer Bar!", "found": true}, {"type": "with", "string": "Echt sch\u00f6n bzw. bitte", "found": true}, {"type": "without", "string": "Relevantes aus dem gizmeo.eu-Archiv:", "found": false}, {"type": "without", "string": "keine Ahnung mehr wie es...", "found": false}, {"type": "without", "string": "\u00a9 2010-2020 gizmeo.eu", "found": false}]}
{"file": "lostiempos.com-juicio.html", "url": "https://www.lostiempos.com/actualidad/pais/20220503/juicio-caso-golpe-ii-entra-recta-final-sentencia-podria-dictarse-este", "text_len": 2537, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "La audiencia que podr\u00eda ser decisiva", "found": true}, {"type": "with", "string": "de Sentencia Anticorrupci\u00f3n de La Paz fij\u00f3", "found": true}, {"type": "with", "string": "condena de tres a\u00f1os de c\u00e1rcel", "found": true}, {"type": "without", "string": "Valora esta noticia", "found": false}, {"type": "without", "string": "sentencia y presenta recurso al TCP", "found": false}, {"type": "without", "string": "abogados en el juicio por el caso \u201cgolpe\u201d.", "found": false}]}
{"file": "teslamag.de-Musk.html", "url": "https://teslamag.de/news/musk-firma-xai-modell-nutzung-tesla-computer-moeglich-62317", "text_len": 3296, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Grok sei als k\u00fcnstliche Intelligenz dem Buch", "found": true}, {"type": "with", "string": "Per Anhalter durch die Galaxis", "found": true}, {"type": "with", "string": "also dazu gedacht, fast jegliche Fragen zu beantworten und sogar selbst Fragen vorzuschlagen", "found": true}, {"type": "without", "string": "NEUESTE BEITR\u00c4GE", "found": false}, {"type": "without", "string": "Widerspr\u00fcchliche Daten: Tesla-Fahrer haben", "found": false}, {"type": "without", "string": "laut Auswertung in USA die meisten Unf\u00e4lle", "found": false}]}
{"file": "echte-demokratie-jetzt.de.blog.html", "url": "http://www.echte-demokratie-jetzt.de/blog/", "text_len": 11932, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Liebe Menschen Europas", "found": true}, {"type": "with", "string": "Dieses Werk bzw. Inhalt", "found": false}, {"type": "with", "string": "\u0391\u03b3\u03b1\u03c0\u03b7\u03c4\u03ad \u03bb\u03b1\u03ad \u03c4\u03b7\u03c2 \u0395\u03c5\u03c1\u03ce\u03c0\u03b7\u03c2", "found": true}, {"type": "without", "string": "von anderen", "found": false}, {"type": "without", "string": "Du h\u00f6rst es oft.", "found": false}, {"type": "without", "string": "Eine Filmempfehlung f\u00fcr die", "found": false}]}
{"file": "disfunctions.de.podcasts.html", "url": "https://disfunctions.de/tutorials/podcasts-in-plex-einbinden/", "text_len": 1530, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ich benutze jetzt seit l\u00e4ngerem", "found": true}, {"type": "with", "string": "filename=$1", "found": true}, {"type": "with", "string": "DOWNLOAD_DIRECTORY", "found": true}, {"type": "without", "string": "Erstellt am Dienstag 6. Mai 2014", "found": false}, {"type": "without", "string": "Das Blog der gnadenlosen Fehlfunktionen!", "found": false}, {"type": "without", "string": "Design von Andreas Viklund", "found": false}]}
{"file": "nestle-family-com-chicken.html", "url": "https://www.nestle-family.com/en/recipes/roasted-chicken-oriental-rice", "text_len": 386, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "1 large or 1200 g whole", "found": true}, {"type": "with", "string": "1 tablespoon ground", "found": true}, {"type": "with", "string": "cups or 1125 ml of", "found": true}, {"type": "without", "string": "NEW AND EXCITING SIMILAR", "found": false}, {"type": "without", "string": "Like recipe?", "found": true}, {"type": "without", "string": "basket and deliver to you", "found": true}]}
{"file": "hildesheimer-presse.de-hund.html", "url": "https://hildesheimer-presse.de/2023/11/01/hund-vertreibt-einbrecher-zeugenaufruf/", "text_len": 1003, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Nach aktuellem Kenntnisstand", "found": true}, {"type": "with", "string": "schlug der Hund des Hausbewohners zur o. g. Zeit pl\u00f6tzlich an", "found": true}, {"type": "with", "string": "Als der Bewohner nach dem Rechten schauen wollte", "found": true}, {"type": "without", "string": "Beliebte Artikel", "found": false}, {"type": "without", "string": "Ambulante Notfallpraxis der KVN Hildesheim", "found": false}, {"type": "without", "string": "Nummer gegen Kummer", "found": false}]}
{"file": "omr.com-Schuhbrand.html", "url": "https://omr.com/de/daily/cowboyboots-und-crocs", "text_len": 8536, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "W\u00e4hrend Birkenstocks aber im Vergleich zum Crocs", "found": true}, {"type": "with", "string": "der gewisse Funfaktor fehle", "found": true}, {"type": "with", "string": "sagt Landowski, bringe man Crocs nicht mit den typischen Birkenstocks-Attributen", "found": true}, {"type": "without", "string": "Empfohlener redaktioneller Inhalt", "found": false}, {"type": "without", "string": "Aktuelle Stories und die wichtigsten News f\u00fcr Marketeers direkt in dein Postfach!", "found": false}, {"type": "without", "string": "OMR Family Member", "found": false}]}
{"file": "Raptastisch.net-Seitenhieb.html", "url": "https://raptastisch.net/2023/11/06/bushido-antwortet-auf-seitenhieb-von-azad-und-erklaert-ihn-fuer-finished/", "text_len": 2264, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Azad war mein Vorbild, doch ist innerlich am Sack", "found": true}, {"type": "with", "string": "Weil er mit f\u00fcnfzig Jahren nichts au\u00dfer Erinnerungen hat", "found": true}, {"type": "with", "string": "Ich half ihm bis zum letzten Satz wie einem Onkel", "found": true}, {"type": "without", "string": "Kranke Zahlen \u2013 Bushido f\u00fchrt im privaten Verkaufsbattle gegen Bonez MC", "found": false}, {"type": "without", "string": "Nie wieder \u2013 Fard gibt Statement zu Farid Bang ab", "found": false}, {"type": "without", "string": "Raptastisch auf Facebook", "found": false}]}
{"file": "hr-innovation.org.enterprise.html", "url": "http://www.hr-innovation.org/hr-innovation-einer-enterprise-2-0/", "text_len": 3429, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Clayton M. Christensen", "found": true}, {"type": "with", "string": "You can\u2019t solve a problem", "found": true}, {"type": "with", "string": "Nur zu selten tritt", "found": true}, {"type": "without", "string": "Copyright \u00a9 2020", "found": false}, {"type": "without", "string": "Geben Sie Ihre E-Mail", "found": false}, {"type": "without", "string": "Initiative zur Entwicklung", "found": false}]}
{"file": "Finowie odkrywaj\u0105 wino _ Res Publica Nowa.html", "url": "https://publica.pl/teksty/rafalska-finowie-odkrywaja-wino-68379.html", "text_len": 10163, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Nie mog\u0105c konkurowa\u0107", "found": true}, {"type": "with", "string": "W Finlandii obowi\u0105zuje", "found": true}, {"type": "with", "string": "koncepcj\u0119 \u201ezero waste\u201d", "found": true}, {"type": "without", "string": "marca 2021", "found": false}, {"type": "without", "string": "Rozmowa z dr nauk", "found": false}, {"type": "without", "string": "Wino lepsze od", "found": false}]}
{"file": "larepublica.pe-minedu.html", "url": "https://larepublica.pe/datos-lr/respuestas/2022/05/02/cronograma-minedu-2022-cuando-seran-las-vacaciones-escolares-atmp/", "text_len": 6849, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "y semipresencial el \u00faltimo 28 de marzo", "found": true}, {"type": "with", "string": "a fin de mejorar las estad\u00edsticas vinculadas al avance", "found": true}, {"type": "with", "string": "compartir alimentos ni utensilios.", "found": true}, {"type": "without", "string": "Quiniela de HOY, s\u00e1bado 7 de mayo: resultados", "found": false}, {"type": "without", "string": "Son tres los periodos de vacaciones durante", "found": false}, {"type": "without", "string": "PUEDES VER: \u00bfQu\u00e9 es la Sunedu,", "found": true}]}
{"file": "jan-grosser.de.xum1541.html", "url": "http://www.jan-grosser.de/art/385_xum1541_dateien_zwischen_linux.html", "text_len": 7221, "tp": 3, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Es gibt verschiedene M\u00f6glichkeiten", "found": true}, {"type": "with", "string": "Die Hardware f\u00fcr den XUM1541", "found": true}, {"type": "with", "string": "Das Innenleben des Geh\u00e4uses", "found": true}, {"type": "without", "string": "If not explicitly specified otherwise", "found": false}, {"type": "without", "string": "cat /dev/brain/ideas >> blog", "found": false}]}
{"file": "blog.teufel.de.leistung.html", "url": "https://blog.teufel.de/musik-und-sport-so-steigern-songs-deine-leistung/", "text_len": 5462, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wenn das Lieblingslied im Radio", "found": true}, {"type": "with", "string": "Hier stellen wir dir einige spannende Fakten dazu vor", "found": true}, {"type": "with", "string": "Playlists, die dich zum Schwitzen bringen", "found": true}, {"type": "without", "string": "Alles \u00fcber Lautsprecher, Heimkino", "found": false}, {"type": "without", "string": "In diesem Blog schreiben Teufel-Kollegen", "found": false}, {"type": "without", "string": "Newsletter abonnieren und 10\u20ac", "found": false}]}
{"file": "theguardian.com.academics.html", "url": "https://www.theguardian.com/education/2020/jan/20/thousands-of-uk-academics-treated-as-second-class-citizens", "text_len": 3648, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "It calls on the", "found": true}, {"type": "with", "string": "But a spokesperson for", "found": true}, {"type": "without", "string": "Available for everyone, funded by readers", "found": false}, {"type": "without", "string": "Make a contribution", "found": false}, {"type": "without", "string": "Striking members of the UCU", "found": false}]}
{"file": "motor1.de-erwischt.html", "url": "https://de.motor1.com/news/545242/bmw-3er-touring-2022-erwischt/", "text_len": 2742, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "eine der beliebtesten", "found": true}, {"type": "with", "string": "3er-Facelifts mit den", "found": true}, {"type": "with", "string": "werden, die auf der in China,", "found": true}, {"type": "without", "string": "Die besten Leasing-Deals", "found": false}, {"type": "without", "string": "Ein Service von", "found": false}, {"type": "without", "string": "Fiat 500 Leasing f\u00fcr 55 Euro", "found": false}]}
{"file": "ambito.com-paritarias.html", "url": "https://www.ambito.com/politica/paritarias/al-rojo-gremios-la-alimentacion-marcan-inflacion-53-abril-y-amenazan-paro-n5431248", "text_len": 3172, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "sindicato ir\u00e1 hoy a una audiencia", "found": true}, {"type": "with", "string": "cerr\u00f3 en 52,7% y en base", "found": true}, {"type": "with", "string": "Se trata de un informe interno que", "found": true}, {"type": "without", "string": "Temas", "found": true}, {"type": "without", "string": "Suscribite a nuestro", "found": false}, {"type": "without", "string": "Informate m\u00e1s", "found": false}]}
{"file": "piratenpartei-hessen.de.nachbarschaftshilfe.html", "url": "https://www.piratenpartei-hessen.de/blog/2020/03/31/solidaritaet-nachbarschaftshilfe/", "text_len": 1211, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "anbieten und ihren Beitrag leisten,", "found": true}, {"type": "with", "string": "Wohle der Allgemeinheit riskieren. Auch die zahlreichen privaten Initiativen", "found": true}, {"type": "with", "string": "ng der Corona-Schutzma\u00dfnahmen und gegenseitiger Solidarit\u00e4t auf", "found": true}, {"type": "without", "string": "0 Piratenpartei Hes", "found": false}, {"type": "without", "string": "Bundesschiedsgericht", "found": false}, {"type": "without", "string": "vKV Kassel Stadt-Land-Web", "found": false}]}
{"file": "lopinion.fr.glyphosate.html", "url": "https://www.lopinion.fr/edition/economie/glyphosate-radiographie-d-intoxication-collective-186859", "text_len": 7362, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "La firme Bayer, propri\u00e9taire", "found": false}, {"type": "with", "string": "Jackpot pour Monsanto qui vend \u00e0 la fois les semences", "found": true}, {"type": "with", "string": "puisque le champ des recherches est infini...", "found": true}, {"type": "without", "string": "Mentions l\u00e9gales", "found": false}, {"type": "without", "string": "Conditions g\u00e9n\u00e9rales de vente", "found": false}, {"type": "without", "string": "Charte des commentaires", "found": false}]}
{"file": "finanztreff.de-Influencer.html", "url": "http://www.finanztreff.de/realtimenews/influencer-und-trading-apps-die-jungen-entdecken-die-boerse/24437626", "text_len": 4636, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "informieren sich bei Instagram", "found": true}, {"type": "with", "string": "ausschlie\u00dflich Einzelaktien ins Depot.", "found": true}, {"type": "with", "string": "Die Kan\u00e4le hei\u00dfen \u00abAktien mit Kopf\u00bb", "found": true}, {"type": "without", "string": "Krypto-Hot-Stock mit 60%", "found": false}, {"type": "without", "string": "MIDDAY BRIEFING - Unternehmen", "found": false}, {"type": "without", "string": "Weitere Nachrichten", "found": false}]}
{"file": "parcoabruzzo.it.58354.html", "url": "http://www.parcoabruzzo.it/dettaglio.php?id=58354", "text_len": 4126, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Il risultato \u00e8 molto positivo", "found": true}, {"type": "with", "string": "naturali di regolazione numerica", "found": true}, {"type": "with", "string": "In questo contesto \u00e8 chiaro", "found": true}, {"type": "without", "string": "Grafico conta femmine con", "found": true}, {"type": "without", "string": "Tel. 0863/91131 - Fax 0863/912132", "found": false}, {"type": "without", "string": "Autore di Parks.it", "found": false}]}
{"file": "sportowefakty.wp.pl.falubaz.html", "url": "https://sportowefakty.wp.pl/zuzel/relacja/110331/fogo-unia-leszno-rm-solar-falubaz-zielona-gora", "text_len": 12625, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Zn\u00f3w lepszy moment startowy miejscowych, lecz", "found": true}, {"type": "with", "string": "W Lesznie zacz\u0105\u0142 mocno pada\u0107 deszcz.", "found": true}, {"type": "with", "string": "Stadion im. Alfreda Smoczyka w Lesznie", "found": true}, {"type": "without", "string": "\u00a9 1995-2020 Grupa WP", "found": false}, {"type": "without", "string": "Polskie gwiazdy", "found": false}, {"type": "without", "string": "Zobacz r\u00f3wnie\u017c", "found": false}]}
{"file": "gipfelbuch.ch-hochaufloesung.html", "url": "https://www.gipfelbuch.ch/outdoornews/detail/id/718", "text_len": 6453, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Um einen ersten Eindruck zu erhalten", "found": true}, {"type": "with", "string": "hilft uns in den Satellitendaten", "found": true}, {"type": "with", "string": " Zusammengefasst ber\u00fccksichtigen wir in", "found": true}, {"type": "without", "string": "Abbildung: Vergleich auf dem Aletschgletscher", "found": false}, {"type": "without", "string": "FRAGEN AN DEN AUTOR", "found": false}, {"type": "without", "string": "Farblich codierte Schneeh\u00f6hendarstellung", "found": false}]}
{"file": "achgut.com-coronalage.html", "url": "https://www.achgut.com/artikel/bericht_zur_coronalage_vom_22.04.2020_worauf_wartet_die_politik", "text_len": 17237, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Noch nicht offiziell ist die Zahl", "found": true}, {"type": "with", "string": "Wie schwer ist die Krankheit", "found": true}, {"type": "with", "string": "Wahlumfrage, Wahlprognose", "found": true}, {"type": "without", "string": "Sie lesen gern Achgut.com?", "found": false}, {"type": "without", "string": "schnell & einfach einen Boot-Stick", "found": false}, {"type": "without", "string": "Sensationelles Urteil f\u00fcr Dieselfahrer", "found": false}]}
{"file": "tonight.de-Arschloch.html", "url": "https://www.tonight.de/unterhaltung/promis/daniela-buechner-danni-und-ennesto-monte-trennen-sich-arschloch_114240.html", "text_len": 3053, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "gescheitert\u201c, schrieb der 46-J\u00e4hrige.", "found": true}, {"type": "with", "string": "einem halben Jahr", "found": true}, {"type": "with", "string": "Danni B\u00fcchner hat derweil ihren", "found": true}, {"type": "without", "string": "Foto: Instagram", "found": false}, {"type": "without", "string": "Wegen Corona:", "found": true}, {"type": "without", "string": "Promis", "found": false}]}
{"file": "leichtathletik-berlin.de-norddeutschland.html", "url": "https://www.leichtathletik-berlin.de/pressemitteilungen_reader/norddeutschland-sucht-seine-meister.html", "text_len": 2995, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Goldrausch auf den 1500 Metern", "found": true}, {"type": "with", "string": "Altersklasse souver\u00e4n auf den 60m", "found": true}, {"type": "with", "string": "den 2. Platz erreichen.", "found": true}, {"type": "without", "string": "Gisele Wender", "found": true}, {"type": "without", "string": "Sponsoren", "found": false}, {"type": "without", "string": "Pressemitteilungen", "found": true}]}
{"file": "volksblatt.at-Alkoholkonsum.html", "url": "https://volksblatt.at/chronik/oesterreich/oesterreich-tranken-pro-kopf-111-liter-alkohol-im-jahr-822151/", "text_len": 2363, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Spitzenreiter Lettland f\u00fchrt das Ranking dabei mit 12,2 Litern pro Kopf an", "found": true}, {"type": "with", "string": "Der OECD-Schnitt liegt dagegen bei 8,6 Litern pro Kopf", "found": true}, {"type": "with", "string": "Der OECD-Bericht \u201eHealth at a Glance\u201c erfasst regelm\u00e4\u00dfig zahlreiche Daten zum Zustand", "found": true}, {"type": "without", "string": "DAS K\u00d6NNTE SIE AUCH INTERESSIEREN", "found": false}, {"type": "without", "string": "OMV verliert Beteiligung an russischem Gasfeld", "found": false}, {"type": "without", "string": "Signa verkauft Chrysler Building und Medienbeteiligungen", "found": false}]}
{"file": "hss.de-Regierung.html", "url": "https://www.hss.de/news/detail/grosse-aufgaben-fuer-die-neue-regierung-news8123/", "text_len": 18533, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Najla Bouden ist die", "found": false}, {"type": "with", "string": "Tunesier landesweit die", "found": true}, {"type": "with", "string": "tunesische Bev\u00f6lkerung durchaus in einer", "found": true}, {"type": "without", "string": "Naher Osten, Nordafrika", "found": false}, {"type": "without", "string": "Bourguiba, Tunis.", "found": false}, {"type": "without", "string": "Ahmed Zarrouki, Avenue Hbib", "found": false}]}
{"file": "berliner-feuerwehr.de-Ehrenzeichen.html", "url": "https://www.berliner-feuerwehr.de/aktuelles/nachrichten/feuerwehr-und-katastrophenschutz-ehrenzeichen-verliehen-3896/", "text_len": 2223, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Ehrenzeichen der Stufe 1", "found": true}, {"type": "with", "string": "Landesbranddirektor Dr. Karsten Homrighausen", "found": true}, {"type": "with", "string": "Kameradinnen und Kameraden erhielten", "found": true}, {"type": "without", "string": "Kameradinnen und Kameraden erhielten", "found": true}, {"type": "without", "string": "\u201eRed levens\u201c - Leben retten", "found": false}, {"type": "without", "string": "Zum Seitenanfang", "found": false}]}
{"file": "bmz.de-schulze.html", "url": "https://www.bmz.de/de/aktuelles/aktuelle-meldungen/schulze-deutschland-an-der-der-seite-wfp-im-kampf-gegen-hunger-103026", "text_len": 3006, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "tragen auch der Klima\u00adwandel", "found": false}, {"type": "with", "string": "Fast f\u00fcnf Millionen Menschen", "found": true}, {"type": "with", "string": "Alleine im letzten Jahr", "found": true}, {"type": "without", "string": "Sonderinitiative EINEWELT", "found": false}, {"type": "without", "string": "SDG 2: Kein Hunger", "found": false}, {"type": "without", "string": "Siehe auch", "found": false}]}
{"file": "mitvergnuegen.de.herbst.html", "url": "https://mitvergnuegen.com/2022/ausflug-herbst-um-berlin/", "text_len": 7904, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Zugegeben, wir", "found": true}, {"type": "with", "string": "Am Werbellinsee gibt", "found": true}, {"type": "with", "string": "Raus aus den Klamotten und rein", "found": true}, {"type": "without", "string": "DIESE ARTIKEL K\u00d6NNTEN DICH INTERESSIEREN", "found": false}, {"type": "without", "string": "ZUR\u00dcCK ZUR STARTSEITE", "found": false}, {"type": "without", "string": "Kategorien", "found": false}]}
{"file": "kinzig.news-Nachhaltigkeit.html", "url": "https://kinzig.news/23578/das-steckt-dahinter-nachhaltigkeit-bei-der-spessart-tourismus-gmbh", "text_len": 8520, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Auf den Tourismus bezogen ist Nachhaltigkeit f\u00fcr uns", "found": true}, {"type": "with", "string": "dass wir die Entwicklung in der Region mit allen Leistungstr\u00e4gern", "found": true}, {"type": "with", "string": "die an der touristischen Wertsch\u00f6pfungskette beteiligt sind", "found": true}, {"type": "without", "string": "MEHR ZUM THEMA", "found": false}, {"type": "without", "string": "Digitalisierung im Forst: Das sind die Chancen und Herausforderungen", "found": false}, {"type": "without", "string": "Naturschutzbeamter Lukas Rippl und Revierleiterin Manuela Gebhard zeigen", "found": false}]}
{"file": "deviante-pfade.de.unbefriedigt.html", "url": "https://www.deviante-pfade.de/unbefriedigt/", "text_len": 4504, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wir alle haben Bed\u00fcrfnisse. Mal mehr", "found": true}, {"type": "with", "string": "Die Situationen, in denen man unbefriedigt", "found": true}, {"type": "with", "string": "Ich denke, dass bei mir auch durch den neu", "found": true}, {"type": "without", "string": "R\u00fcckblick auf das Blog-Jahr 2019", "found": false}, {"type": "without", "string": "Durch die weitere Nutzung der Seite", "found": false}, {"type": "without", "string": "Orgasmuskontrolle und Sexentzug", "found": false}]}
{"file": "auto-presse.de-minisuv.html", "url": "https://auto-presse.de/autonews.php?newsid=6486285", "text_len": 1321, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "wenige Wochen nach", "found": true}, {"type": "with", "string": "1,5-Liter-Hybridantrieb", "found": true}, {"type": "with", "string": "Mit dem demn\u00e4chst", "found": true}, {"type": "without", "string": "Top Meldungen", "found": false}, {"type": "without", "string": "Mazda fertigt flexibler", "found": false}, {"type": "without", "string": "f\u00fcr dynamische Fortbewegung", "found": false}]}
{"file": "anglerboard.de-rute.html", "url": "https://anglerboard.de/ams/raubfisch-rute-im-test-die-iaconelli-spinning-rod.434/", "text_len": 8646, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Classic-Gewinner Mike \"IKE\" Iaconelli", "found": true}, {"type": "with", "string": "ist f\u00fcr jeden Spinnangler hier die", "found": true}, {"type": "with", "string": "Zuerst ging es f\u00fcr mich aufs Boot, um", "found": true}, {"type": "without", "string": "Kategorie Catch more fish", "found": false}, {"type": "without", "string": "Pulse Realistic Softbaits - wie echt!", "found": false}, {"type": "without", "string": "Diesen Artikel teilen", "found": false}]}
{"file": "hrjournal.de.trends.html", "url": "https://www.hrjournal.de/fuenf-hr-trends-2023/", "text_len": 5448, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Auch wenn Mitarbeitende Zusch\u00fcsse", "found": true}, {"type": "with", "string": "Doch sollten Arbeitgeber nicht selbstgef\u00e4llig", "found": true}, {"type": "with", "string": "Unternehmen, ganz gleich welcher", "found": true}, {"type": "without", "string": "Lesen Sie auch die folgenden Beitr\u00e4ge:", "found": true}, {"type": "without", "string": "Zur Person", "found": false}, {"type": "without", "string": "Die Zusammenarbeit und F\u00fchrung von Teams", "found": false}]}
{"file": "pythonspeed.com.docker.html", "url": "https://pythonspeed.com/articles/pipenv-docker/", "text_len": 7072, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "CMD flask run exampleapp:app", "found": true}, {"type": "with", "string": "The takeaway", "found": true}, {"type": "with", "string": "Install dependencies separately and earlier in your Dockerfile to ensure faster builds.", "found": false}, {"type": "without", "string": "Learn how to build fast, production-ready Docker images\u2014read the rest of ", "found": false}, {"type": "without", "string": "You need to stay competitive in the job market\u2014but there", "found": false}, {"type": "without", "string": "Next: Elegantly activating a virtualenv in a Dockerfile", "found": false}]}
{"file": "thelocal.se.tattooed.html", "url": "https://www.thelocal.se/20200428/meet-the-swede-who-tattooed-a-state-epidemiologists-face-on-his-arm", "text_len": 2308, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "epidemiologist Anders Tegnell has become a household name", "found": false}, {"type": "with", "string": "to get the tattoo after Tastas advertised the design", "found": true}, {"type": "with", "string": "Asked about the tattoo last week by newspaper GP", "found": true}, {"type": "without", "string": "to leave a comment", "found": false}, {"type": "without", "string": "Advertisement", "found": false}, {"type": "without", "string": "The latest news about the coronavirus outbreak", "found": false}]}
{"file": "martinruetter.com-Winter.html", "url": "https://www.martinruetter.com/service/aktuelles/aktuelles/schneefloeckchen-weissroeckchen-mit-hund-im-winter/", "text_len": 5799, "tp": 2, "fn": 1, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Spaziergang in geschlossener Schneedecke", "found": false}, {"type": "with", "string": "M\u00fcssen Hunde im Winter auch Schneeschuhe", "found": true}, {"type": "with", "string": "Wichtig bei allen Trainingsstunden", "found": true}, {"type": "without", "string": "Martin R\u00fctter DOGS", "found": true}, {"type": "without", "string": "Umgang mit dem", "found": false}, {"type": "without", "string": "HUNDESCHULEN", "found": false}]}
{"file": "eurailpress.de-rekordniveau.html", "url": "https://www.eurailpress.de/nachrichten/unternehmen-maerkte/detail/news/hafen-goeteborg-umschlag-auf-rekordniveau.html", "text_len": 724, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Bahnshuttles zur\u00fcckzuf\u00fchren, die den Hafen", "found": true}, {"type": "with", "string": "Der Hafen rechnet wegen des Ausbaus des", "found": true}, {"type": "with", "string": "unter anderem auf die Einf\u00fchrung", "found": true}, {"type": "without", "string": "Redaktion Eurailpress", "found": false}, {"type": "without", "string": "Artikel", "found": false}, {"type": "without", "string": "Unternehmen & M\u00e4rkte", "found": false}]}
{"file": "unendlich-viel-energie-strompreisbremse.html", "url": "https://www.unendlich-viel-energie.de/themen/strom/umfrage-zur-strompreisbremse-oekostromkundinnen-besonders-sensibel-fuers-stromsparen", "text_len": 3402, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "D\u00fcsseldorf, 22. November 2022 -", "found": true}, {"type": "with", "string": "\u201eDie gro\u00dfe Mehrheit der Bev\u00f6lkerung", "found": true}, {"type": "with", "string": "Das Marktforschungsunternehmen YouGov", "found": true}, {"type": "without", "string": "Diesen Artikel teilen", "found": false}, {"type": "without", "string": "Newsletter November", "found": false}, {"type": "without", "string": "Suche", "found": false}]}
{"file": "rheinruhronline.de.essenwestviertel.html", "url": "https://www.rheinruhronline.de/essen/essen2/essenwestviertel/essenwestviertel.htm", "text_len": 9219, "tp": 2, "fn": 1, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Essen-Westviertel Ehemaliges Press- und", "found": false}, {"type": "with", "string": "geringe Wohnbebauung auf", "found": true}, {"type": "with", "string": "Colosseum Theater Essen", "found": true}, {"type": "without", "string": "- Anzeige-", "found": false}, {"type": "without", "string": "N\u00fctzliche Apps und Services", "found": false}]}
{"file": "netzfueralle.blog.rosalux.de.netzpolitik.html", "url": "https://netzfueralle.blog.rosalux.de/2019/10/30/netzpolitik-als-us-wahlkampfthema/", "text_len": 6044, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Radikal-reformistischer Vorschlag", "found": true}, {"type": "with", "string": "I am a capitalist. Come on", "found": true}, {"type": "with", "string": "Was die Problemwahrnehmung angeht", "found": true}, {"type": "without", "string": "Vorstudie zur Men\u00fcerweiterung durch FOSS-Produkte bei der RLS", "found": false}, {"type": "without", "string": "Smarte Worte", "found": false}, {"type": "without", "string": "Netz f\u00fcr Alle bei Facebook", "found": false}]}
{"file": "parallels.com.desktop.html", "url": "https://www.parallels.com/products/desktop/", "text_len": 12995, "tp": 3, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Quickly move files, apps and more", "found": true}, {"type": "with", "string": "#1 choice of Mac Users", "found": true}, {"type": "with", "string": "Visual Studio plug-In", "found": true}, {"type": "without", "string": "\u00a9 1999-2020 Parallels", "found": false}, {"type": "without", "string": "Parallels Mac Management for SCCM", "found": false}]}
{"file": "pagina12.com.ar-suprema.html", "url": "https://www.pagina12.com.ar/419327-la-corte-suprema-no-imparte-justicia-sino-injusticia", "text_len": 7508, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Organismos de derechos", "found": true}, {"type": "with", "string": "entendi\u00f3 como un desaf\u00edo a los poderes", "found": true}, {"type": "with", "string": "desactivada durante el gobierno de Mauricio", "found": true}, {"type": "without", "string": "INGRESAR", "found": false}, {"type": "without", "string": "Imagen: T\u00e9lam", "found": false}, {"type": "without", "string": "Corte Suprema", "found": true}]}
{"file": "correio24horas.com.br-PMS.html", "url": "https://www.correio24horas.com.br/noticia/nid/lider-do-grupo-de-sequestradores-que-tinha-pms-foi-morto-em-confronto-policial/", "text_len": 2300, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "mediante sequestro, e que", "found": true}, {"type": "with", "string": "lotados na Rondesp Atl\u00e2ntico", "found": true}, {"type": "with", "string": "Ele tamb\u00e9m era investigado", "found": true}, {"type": "without", "string": "Em tempos de coronav\u00edrus e desinforma\u00e7\u00e3o", "found": false}, {"type": "without", "string": "(Foto: Tony Silva/Ascom-PC)", "found": false}, {"type": "without", "string": "Pol\u00edcia faz opera\u00e7\u00e3o de combate a", "found": false}]}
{"file": "lastampa.it.temperature.html", "url": "https://www.lastampa.it/cronaca/2020/02/19/news/temperature-in-calo-in-tutta-italia-attesa-neve-sull-appennino-1.38487954", "text_len": 2729, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "torner\u00e0 in poche ore", "found": true}, {"type": "with", "string": "sopra i 1400 metri.", "found": true}, {"type": "with", "string": "specialmente in Galles.", "found": true}, {"type": "without", "string": "La grande sete", "found": false}, {"type": "without", "string": "Argomenti", "found": false}, {"type": "without", "string": "Ultima modifica", "found": false}]}
{"file": "sass-ag.de.index.html", "url": "https://sass-ag.de", "text_len": 4613, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wir beraten herstellerunabh\u00e4ngig und planen immer objektiv", "found": true}, {"type": "with", "string": "Kaufen Sie bei uns preiswerte Etiketten in Ihrem", "found": true}, {"type": "with", "string": "Wir bieten professionelle Drucksysteme f\u00fcr alle Anwendungsbereiche; ganz", "found": true}, {"type": "without", "string": "Produkte & Leistungen", "found": false}, {"type": "without", "string": "Zentrale Gilching", "found": false}, {"type": "without", "string": "St\u00f6rungen:", "found": false}]}
{"file": "bmfsfj.de-praesidentschaft.html", "url": "https://www.bmfsfj.de/bmfsfj/aktuelles/alle-meldungen/bundeskabinett-legt-schwerpunkte-der-praesidentschaft-fest-192440", "text_len": 3294, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Gruppe der Sieben verst\u00e4ndigt", "found": false}, {"type": "with", "string": "Am 1. Januar hat Deutschland turnusgem\u00e4\u00df", "found": true}, {"type": "with", "string": "ein starkes Miteinander.", "found": true}, {"type": "without", "string": "G7 Germany 2022: Informationen zur", "found": false}, {"type": "without", "string": "Internationales und Europa", "found": false}, {"type": "without", "string": "Bundesregierung/Steffen Kugler", "found": false}]}
{"file": "blog.mondediplo.net.turpitude.html", "url": "https://blog.mondediplo.net/turpitude-et-architecture", "text_len": 4209, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "sation des rapports intercor\u00e9ens, il voit \u00e0 75 ans le rapprochement se r\u00e9aliser", "found": false}, {"type": "with", "string": "malgr\u00e9 tout l\u2019amiti\u00e9 et l\u2019entraide occupent une grande place", "found": true}, {"type": "with", "string": "hitecte de ressentir des moments de nostalgie en repensa", "found": true}, {"type": "without", "string": "arr\u00eate, on r\u00e9fl\u00e9chit", "found": false}, {"type": "without", "string": "des clefs du monde contemporain. Depuis le d\u00e9but du XXIe si\u00e8cle, le", "found": false}, {"type": "without", "string": "engagent que leurs auteurs.", "found": false}]}
{"file": "slf.ch-lawinensituation.html", "url": "https://www.slf.ch/de/lawinenbulletin-und-schneesituation/wochen-und-winterberichte/2021/22/wochenbericht-14-20-januar-2022.html", "text_len": 4414, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "dieser Satz fand sich mehrfach in", "found": true}, {"type": "with", "string": "In den Alpen zeigte sich dies mit wiederholt", "found": true}, {"type": "with", "string": "Diese f\u00fchrte zu einer deutlichen Abk\u00fchlung", "found": true}, {"type": "without", "string": "Die gr\u00f6sste Lawine dieser Berichtsperiode", "found": false}, {"type": "without", "string": "Oberfl\u00e4chenreif in einem Nordhang", "found": false}, {"type": "without", "string": "Lawinenbulletins dieser Zeitperiode im \u00dcberblick.", "found": true}]}
{"file": "majkaswelt.com.fashion.html", "url": "https://majkaswelt.com/top-5-fashion-must-haves-2018-werbung/", "text_len": 2409, "tp": 2, "fn": 1, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "R\u00fcschen und Volants.", "found": true}, {"type": "with", "string": "ihr jedes Jahr tragen k\u00f6nnt?", "found": true}, {"type": "with", "string": "mein\u00a0Lieblingskleid\u00a0vereint", "found": false}, {"type": "without", "string": "Das k\u00f6nnte dich auch interessieren", "found": false}, {"type": "without", "string": "Catherine Classic Lac 602", "found": false}]}
{"file": "tierschutz-berlin.de-boellerverzicht.html", "url": "https://tierschutz-berlin.de/aktuelles/tierschutzverein-ruft-zu-boellerverzicht-auf/", "text_len": 1958, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Vorstandsvorsitzende Eva R\u00f6nspie\u00df.", "found": true}, {"type": "with", "string": "ihre Lieblinge m\u00f6glichst gut gegen", "found": true}, {"type": "with", "string": "Silvesternacht gerade in Stadtrandbezirken", "found": true}, {"type": "without", "string": "Tierschutzverein f\u00fcr Berlin und Umgebung", "found": false}, {"type": "without", "string": "Bank f\u00fcr Sozialwirtschaft", "found": false}, {"type": "without", "string": "Hausvaterweg 39", "found": false}]}
{"file": "gothamist.com-plagues.html", "url": "https://gothamist.com/news/rezoning-plan-plagues-bronx-city-councilmembers-re-election-bid", "text_len": 3447, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "pitch to build a casino at the foot of the Whitestone Bridge", "found": true}, {"type": "with", "string": "buying the contract to operate Trump Golf Links Ferry Point", "found": true}, {"type": "with", "string": "earlier this year is also sparking opposition.", "found": true}, {"type": "without", "string": "We rely on your support to make local news available to all", "found": false}, {"type": "without", "string": "NYC election results: A surprisingly tight race in the Bronx as incumbents lead elsewhere", "found": false}, {"type": "without", "string": "Early Addition: Big year for sleeping with tape over your mouth", "found": false}]}
{"file": "bostonherald.com-Brothel-catering.html", "url": "https://www.bostonherald.com/2023/11/08/brothel-catering-to-politicians-doctors-lawyers-busted-in-boston/", "text_len": 3710, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "sex ring catering to wealthy doctors", "found": true}, {"type": "with", "string": "lawyers, politicians, and military officers who paid up to $600 an hour", "found": true}, {"type": "with", "string": "prostitutes was busted in Boston, the feds announced", "found": true}, {"type": "without", "string": "MOST POPULAR", "found": false}, {"type": "without", "string": "TRENDING NATIONALLY", "found": false}, {"type": "without", "string": "MORE IN LOCAL NEWS", "found": false}]}
{"file": "damianduchamps.wordpress.com.hbdi.html", "url": "https://damianduchamps.wordpress.com/2019/08/03/office-365-hbdi-die-dritte/", "text_len": 11116, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Es bleibt weiterhin spannend", "found": true}, {"type": "with", "string": "Auch Schulen, die nicht unter 1", "found": true}, {"type": "with", "string": "Wie letzteres umzusetzen ist, daf\u00fcr", "found": true}, {"type": "without", "string": "Erstelle eine kostenlose Website oder Blog", "found": false}, {"type": "without", "string": "Um neue Beitr\u00e4ge per E-Mail zu", "found": false}, {"type": "without", "string": "Kommentar verfassen", "found": false}]}
{"file": "archive.modabot.de.serkan.html", "url": "https://web.archive.org/web/20190717140047/http://www.modabot.de/paris-haute-couture-ss14-serkan-cura", "text_len": 729, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "die diesmal leider keine Pr\u00e4sentation", "found": true}, {"type": "with", "string": "Die dabei entstehenden Silhouetten", "found": true}, {"type": "without", "string": "to see what your friends like", "found": false}, {"type": "without", "string": "Bild via", "found": false}]}
{"file": "archive.org.dimido.de.marketing.html", "url": "https://web.archive.org/web/20080731095558/http://www.dimido.de/2008/07/29/was-ist-virales-marketing/", "text_len": 788, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Marketing halten, habe aber keine Lust dazu, dies zu machen", "found": true}, {"type": "with", "string": "was unter Virales Marketing zu verstehen ist und wie wir unbewusst dadurch beeinflusst werden", "found": true}, {"type": "with", "string": "von Virales Marketing, habe ich festgestellt.", "found": true}, {"type": "without", "string": "besserwisser: Stecker ziehen f\u00fcr ne neue IP bringt nix.", "found": false}, {"type": "without", "string": "\u00fcbernimmt Cherry Corporation", "found": false}, {"type": "without", "string": " E-Mail (wird ben\u00f6tigt und nicht ver\u00f6ffentlicht)", "found": false}]}
{"file": "markeich.de.impressum.html", "url": "https://www.markeich.de/kontakt/impressum-werbeagentur-soltau/", "text_len": 2867, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "ngaben gem\u00e4\u00df \u00a7 5 TMG", "found": false}, {"type": "with", "string": "bieter oder Betreiber der Seiten verantwortlich. Die verlinkten Seiten wurden zum Zeitpunkt der Verlinkung auf m\u00f6gliche Rechtsverst\u00f6\u00dfe \u00fcberpr\u00fcft. Rechtsw", "found": false}, {"type": "with", "string": "rtlich f\u00fcr den Inhalt nach \u00a7 55 Abs. 2 RStV", "found": false}, {"type": "without", "string": "Auszeichnungen", "found": false}, {"type": "without", "string": "\u00a9 2020 Agentur MARKE ICH", "found": false}, {"type": "without", "string": "Es gilt die Datenschutzerkl\u00e4rung.", "found": false}]}
{"file": "cleanthinking.de.oranger-wasserstoff.html", "url": "https://www.cleanthinking.de/oranger-wasserstoff-erdkruste/", "text_len": 3298, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Franz\u00f6sische Forscher wollen", "found": true}, {"type": "with", "string": "Gr\u00fcner Wasserstoff und seine erneuerbaren", "found": true}, {"type": "with", "string": "Oranger Wasserstoff aus der Erdkruste:", "found": true}, {"type": "without", "string": "HINTERLASSE EINE ANTWORT", "found": false}, {"type": "without", "string": "Diese Website verwendet Akismet", "found": false}, {"type": "without", "string": "Buch-Tipp:", "found": false}]}
{"file": "greenpeace.de.nachhaltigleben.html", "url": "https://www.greenpeace.de/engagieren/nachhaltiger-leben", "text_len": 9647, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Jede:r Deutsche kauft im Schnitt ", "found": true}, {"type": "with", "string": "F\u00fcr vier gro\u00dfe industriell-genutzten Materialstr\u00f6me", "found": true}, {"type": "with", "string": "Als Gesellschaft k\u00f6nnen wir die Verantwortung", "found": true}, {"type": "without", "string": "PETITION", "found": false}, {"type": "without", "string": "Mehr zu Klima und Konsum", "found": false}, {"type": "without", "string": "Zum Weiterlesen", "found": false}]}
{"file": "coopbuddy.de.bee.html", "url": "https://www.coopbuddy.de/games/bee-simulator/", "text_len": 504, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Entdecke die gro\u00dfen Abenteuer", "found": true}, {"type": "with", "string": "Bee Simulator Mehrspieler", "found": true}, {"type": "with", "string": "Koop und Splitscreen-Modus", "found": true}, {"type": "without", "string": "Dieses Kommentarformular steht", "found": false}, {"type": "without", "string": "Splitscreen Coop", "found": false}, {"type": "without", "string": "Wenn ja, auf welcher Plattform?", "found": false}]}
{"file": "scmp.com.playbook.html", "url": "https://www.scmp.com/comment/opinion/article/3046526/taiwanese-president-tsai-ing-wens-political-playbook-should-be", "text_len": 336, "tp": 0, "fn": 3, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "almost insulting to Hongkongers", "found": false}, {"type": "with", "string": "a sign she was working hard for the", "found": false}, {"type": "with", "string": "using political shrewdness", "found": false}, {"type": "without", "string": "Alice Wu fell down the rabbit hole", "found": false}, {"type": "without", "string": "Lam staying on as chief executive", "found": false}, {"type": "without", "string": "Tsai says Beijing must face", "found": false}, {"type": "without", "string": "By registering, you agree to", "found": false}]}
{"file": "wikimediafoundation.org.turkey.html", "url": "https://wikimediafoundation.org/news/2020/01/15/access-to-wikipedia-restored-in-turkey-after-more-than-two-and-a-half-years/", "text_len": 3368, "tp": 2, "fn": 1, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "19th birthday", "found": true}, {"type": "with", "string": "Bu yaz\u0131n\u0131n T\u00fcrk\u00e7e\u2019sini buradan okuyabilirsiniz", "found": false}, {"type": "with", "string": "We will keep this statement updated", "found": true}, {"type": "without", "string": "Read further in the pursuit of knowledge", "found": false}, {"type": "without", "string": "what that means.", "found": false}, {"type": "without", "string": "Stay up-to-date on our work.", "found": false}, {"type": "without", "string": "Photo credits", "found": false}]}
{"file": "0b96fc66e2c94f45a1b923ec9a31fcf2.html", "url": "https://www.nachrichten.at/meine-welt/gesundheit/was-bringen-alternative-therapien-bei-krebs;art114,3177663", "text_len": 3351, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Dar\u00fcber diskutieren Experten seit gestern", "found": true}, {"type": "with", "string": "Wer sollte also die Komplement\u00e4rmedizin anbieten?", "found": true}, {"type": "with", "string": "www.selbertun.at", "found": true}, {"type": "without", "string": "Leiterin Redaktion Leben", "found": false}, {"type": "without", "string": "Die O\u00d6Nachrichten nehmen den Schutz Ihrer Privatsph\u00e4re sehr ernst.", "found": false}, {"type": "without", "string": "3:1 - Vorw\u00e4rts Steyr half der SV Ried ", "found": false}]}
{"file": "erfolg-magazin.de.konfliktkultur.html", "url": "https://erfolg-magazin.de/mit-der-richtigen-konfliktkultur-zum-erfolg/", "text_len": 5534, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Unternehmen setzen alles", "found": true}, {"type": "with", "string": "Unser ganzes Leben geht es", "found": true}, {"type": "with", "string": "Und was am wichtigsten ist: ", "found": true}, {"type": "without", "string": "Will Smith: Selbsthilfeb\u00fccher als Teil seines Erfolgsgeheimnisses", "found": false}, {"type": "without", "string": "Impressum", "found": false}, {"type": "without", "string": "\u00bbWir brauchen Leute, die Entscheidungen treffen\u00ab", "found": false}]}
{"file": "publikum.net-HPV-Impfungen.html", "url": "https://publikum.net/japan-und-die-hpv-impfungen/", "text_len": 5558, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Vor langer, langer Zeit hatte ich schon einmal", "found": true}, {"type": "with", "string": "die Behauptung aufgegriffen", "found": true}, {"type": "with", "string": "Japan h\u00e4tte die HPV-Impfungen verboten", "found": true}, {"type": "without", "string": "Werde teil der Community!", "found": false}, {"type": "without", "string": "Melde dich jetzt an, um selbst Artikel zu verfassen", "found": false}, {"type": "without", "string": "zu kommentieren und mitzubestimmen", "found": false}]}
{"file": "d71bfdce9dd246c9a6ee6d08c8b39e4c.html", "url": "https://www.monsterdealz.de/user-deals/deals/gratisartikel-kostenlos/rewe-produkttest-10-000-produkttester-fuer-leibniz-keksn-cream-milk-oder-choco", "text_len": 422, "tp": 3, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "\u201eAu\u00dfen knusprig, innen cremig\u201c", "found": true}, {"type": "with", "string": "Das beste kommt jetzt:", "found": true}, {"type": "with", "string": "Euer HansEhrlich", "found": true}, {"type": "without", "string": "Kostenlos zum Newsletter anmelden", "found": false}, {"type": "without", "string": "GRATIS-Jahresabo abstauben", "found": false}, {"type": "without", "string": "Top-Vergleiche", "found": false}, {"type": "without", "string": "Noch nicht angemeldet?", "found": false}]}
{"file": "mein-mmo.de-MMORPG.html", "url": "https://mein-mmo.de/silkroad-online-erstes-mmorpg-cringe-dieb/", "text_len": 7308, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die erste gro\u00dfe MMORPG-Liebe ist etwas ganz besonderes", "found": true}, {"type": "with", "string": "Selbst wenn viele Erinnerungen inzwischen ein wenig verschwommen sind", "found": true}, {"type": "with", "string": "wei\u00df ich noch sehr gut", "found": true}, {"type": "without", "string": "MEHR KOLUMNEN AUF MEINMMO", "found": false}, {"type": "without", "string": "KOMMENDE SPIELE", "found": false}, {"type": "without", "string": "NEUESTE ARTIKEL", "found": false}]}
{"file": "austria.info.radfahren.html", "url": "https://www.austria.info/de/aktivitaten/radfahren/radfahren-in-der-weltstadt-salzburg", "text_len": 926, "tp": 2, "fn": 1, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Salzburg liebt seine Radfahrer.", "found": true}, {"type": "with", "string": "Puls einsaugen zu lassen.", "found": true}, {"type": "with", "string": "Radfahren in der Fu\u00dfg\u00e4ngerzone der Innenstadt ist erlaubt", "found": false}, {"type": "without", "string": "Das k\u00f6nnte Sie auch interessieren ...", "found": false}, {"type": "without", "string": "So macht Radfahren sonst noch Spa\u00df", "found": false}]}
{"file": "katholisch.at-alleinerziehende.html", "url": "https://www.katholisch.at/aktuelles/136290/alleinerziehende-kinderbetreuung-flaechendeckend-ausbauen", "text_len": 2710, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "anl\u00e4sslich des internationalen", "found": true}, {"type": "with", "string": "kosteng\u00fcnstigen, niederschwelligen und", "found": true}, {"type": "with", "string": "Die Plattform f\u00fcr Alleinerziehende", "found": true}, {"type": "without", "string": "Einkommens sein", "found": false}, {"type": "without", "string": "wie etwa Caritas-Lerncaf\u00e9s", "found": false}, {"type": "without", "string": "Symposium des Akademikerverbands", "found": false}]}
{"file": "anarc.at.cdpath.html", "url": "https://anarc.at/blog/2020-10-18-cdpath-replacement/", "text_len": 2204, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": " I figured I might as well bite the", "found": true}, {"type": "with", "string": "Those projects can be used to track files", "found": true}, {"type": "with", "string": "this list through a command or the menu", "found": true}, {"type": "without", "string": "Contact", "found": false}, {"type": "without", "string": "Copyleft \u00a9 2002-2016 The Anarcat", "found": false}, {"type": "without", "string": " Powered by", "found": false}]}
{"file": "salon.com.emissions.html", "url": "https://www.salon.com/2020/01/10/despite-everything-u-s-emissions-dipped-in-2019_partner/", "text_len": 2710, "tp": 2, "fn": 1, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "This post originally", "found": false}, {"type": "with", "string": "The same can\u2019t be", "found": true}, {"type": "with", "string": "Cleaning up the electrical grid", "found": true}, {"type": "without", "string": "Credit:", "found": true}, {"type": "without", "string": "Advertisement:", "found": false}, {"type": "without", "string": "Reproduction of material from any", "found": false}]}
{"file": "corkbeo.ie.level.html", "url": "https://www.corkbeo.ie/news/local-news/level-3-live-cork-ireland-19056312", "text_len": 19018, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Tonight at midnight Cork will be moved into Level 3", "found": true}, {"type": "with", "string": "So we thought that this is not the", "found": true}, {"type": "with", "string": "Taoiseach Micheal Martin confirmed this evening that", "found": true}, {"type": "without", "string": "Never miss the latest news by signing", "found": true}, {"type": "without", "string": "Corrections and Clarifications", "found": false}, {"type": "without", "string": "The latest update for the Irish abroad", "found": false}]}
{"file": "swr.de-volleyball.html", "url": "https://www.swr.de/sport/mehr-sport/volleyball/mtv-stuttgart/stuttgart-ohne-rivers-im-finale-100.html", "text_len": 2228, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\"Was genau sie hat", "found": true}, {"type": "with", "string": "Lena Gro\u00dfe Scharmann \u00fcbernimmt", "found": true}, {"type": "with", "string": "letzten beiden Finalspielen", "found": true}, {"type": "without", "string": "Die meistgelesenen Artikel", "found": false}, {"type": "without", "string": "Gelten neue Regeln", "found": false}, {"type": "without", "string": "Corona-Alarmstufe", "found": false}]}
{"file": "falstaff.de-burgenland.html", "url": "https://www.falstaff.de/nd/burgenland-best-of-ruster-ausbruch-dac/", "text_len": 3267, "tp": 2, "fn": 1, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Jahr 2020 ist dieses Juwel aus", "found": false}, {"type": "with", "string": "Die sanften H\u00e4nge des Ruster H\u00fcgellands", "found": true}, {"type": "with", "string": "Ruster Ausbruch DAC", "found": true}, {"type": "without", "string": "Mehr zum Thema", "found": false}, {"type": "without", "string": "ERSCHIENEN IN", "found": false}, {"type": "without", "string": "Rust am Westufer des", "found": true}]}
{"file": "natuerliche-jagd.de-seminar.html", "url": "https://www.natuerlich-jagd.de/allgemein/neue-djv-online-seminare/", "text_len": 1566, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Umgang mit den sozialen Medien sowie", "found": true}, {"type": "with", "string": "Wie m\u00fcssen Texte und Fotos daf\u00fcr", "found": true}, {"type": "with", "string": "t\u00e4tige Presseobleute aus den", "found": true}, {"type": "without", "string": "Quelle: Deutscher Jagdverband (DJV)", "found": true}, {"type": "without", "string": "Neue DJV-Online-Seminare starten im M\u00e4rz", "found": false}, {"type": "without", "string": "Folgen Sie uns", "found": false}]}
{"file": "guenter-pilger.de.mailaktion.html", "url": "https://www.guenter-pilger.de/mailaktion.htm", "text_len": 2474, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "ich protestiere gegen die erneute", "found": true}, {"type": "with", "string": "Geantwortet haben nur \"Die Linken\"", "found": true}, {"type": "with", "string": "in denen Sie die B\u00fcrger zur privaten", "found": true}, {"type": "without", "string": "Rentenpolitik | Blog | Mailaktion Bundestag | Alles klar?", "found": false}, {"type": "without", "string": "Startseite", "found": false}, {"type": "without", "string": "Partnerseiten", "found": false}]}
{"file": "axios.com.future.html", "url": "https://www.axios.com/newsletters/axios-future-7120a6cf-cf67-4e01-9f15-f73f114e8d27.html", "text_len": 3652, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "A new breed of intelligent video surveillance is being installed", "found": true}, {"type": "with", "string": "good kid, m.A.A.d city,\" the 5th song starts 19 ", "found": false}, {"type": "with", "string": "to school districts and universities, in addition to banks", "found": true}, {"type": "without", "string": "Axios newsletters", "found": false}, {"type": "without", "string": "Online tracking choices", "found": false}, {"type": "without", "string": "Axios podcasts", "found": false}]}
{"file": "bfs.de-radon.html", "url": "https://www.bfs.de/SharedDocs/Pressemitteilungen/BfS/DE/2022/001.html", "text_len": 5859, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "richtet sich an alle, die sich \u00fcber die Radon-Situation", "found": true}, {"type": "with", "string": "dar\u00fcber hinaus bereits vorhandene Messdaten", "found": true}, {"type": "with", "string": "nur mit einer Radon-Messung im Boden", "found": true}, {"type": "without", "string": "Was ist Radon?", "found": false}, {"type": "without", "string": "Radon in der Boden-Luft in Deutschland", "found": false}, {"type": "without", "string": "Wie bewerten Sie diesen Artikel?", "found": false}]}
{"file": "achtundvierzig.hypotheses.org.822.html", "url": "https://achtundvierzig.hypotheses.org/822", "text_len": 1556, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Das DFG-Projekt \u201eEdition der Akten", "found": true}, {"type": "with", "string": "Kulturgeschichte des Politischen", "found": true}, {"type": "with", "string": "eine zeitliche Konzentration", "found": true}, {"type": "without", "string": "Vorheriger Beitrag", "found": false}, {"type": "without", "string": "Deine E-Mail-Adresse wird nicht ver\u00f6ffentlicht.", "found": false}, {"type": "without", "string": "Diese Website verwendet Akismet", "found": false}]}
{"file": "pcgamer.com.darkest.html", "url": "https://www.pcgamer.com/through-the-darkest-of-times-review/", "text_len": 6076, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "your grip on the concept further, by saying little more than \"go s", "found": true}, {"type": "with", "string": "Developer Paintbucket Games", "found": true}, {"type": "with", "string": "A superbly crafted game that serves as storyteller, teacher, and concerned friend.", "found": false}, {"type": "without", "string": "PC Gamer Newsletter", "found": false}, {"type": "without", "string": "C Gamer is supported by its audience. When you buy throu", "found": false}, {"type": "without", "string": "Also on PC Gamer", "found": false}]}
{"file": "thelist.com.multivitamin.html", "url": "https://www.thelist.com/214894/when-you-take-a-multivitamin-every-day-this-is-what-happens-to-your-body/", "text_len": 16695, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Do you take a multivitamin every day?", "found": true}, {"type": "with", "string": "sleeping for seven to nine hours a night", "found": true}, {"type": "with", "string": "help steel yourself against any nutritional fallout.", "found": true}, {"type": "without", "string": "If you take turmeric every day, you might", "found": false}, {"type": "without", "string": "retro-hipster chic (so 2010!) to your bathroom.", "found": false}, {"type": "without", "string": "everyone has different nutritional needs, and she", "found": false}]}
{"file": "jagdoesterreich.at-Parkpl\u00e4tze.html", "url": "https://www.jagd-oesterreich.at/2021/12/14/noe-jagdverband-auf-natur-wildtier-beduerfnisse-achten/", "text_len": 4423, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ruhe, \u00c4sung und Deckung.", "found": false}, {"type": "with", "string": "Immer auf (Forst-)Stra\u00dfen oder", "found": true}, {"type": "with", "string": "Parkverbote missachten und auf Forst-", "found": true}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}, {"type": "without", "string": "N\u00d6 Jagdverband: Auf Natur", "found": false}, {"type": "without", "string": "FOLGEN SIE UNS:", "found": false}]}
{"file": "rosalux.de-quarantaene.html", "url": "https://www.rosalux.de/news/id/45292/wir-waren-fast-40-tage-in-quarantaene?cHash=39ac749d120d127296ab076c203053d3", "text_len": 6771, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wir waren fast 40 Tage in Quarant\u00e4ne", "found": false}, {"type": "with", "string": "Wo sind Sie in die", "found": true}, {"type": "with", "string": "Es war nach dem", "found": true}, {"type": "without", "string": "zum Thema", "found": false}, {"type": "without", "string": "Teilen:", "found": false}, {"type": "without", "string": "z\u00e4hlt f\u00fcr sie nicht", "found": false}]}
{"file": "arteradio.com-nuls.html", "url": "https://www.arteradio.com/son/61661515/la_voix_des_nuls", "text_len": 1442, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "revendication prend chaque", "found": true}, {"type": "with", "string": "jour par les \"gilets", "found": true}, {"type": "with", "string": "sp\u00e9cialiste du sujet.", "found": true}, {"type": "without", "string": "Vous aimerez aussi", "found": false}, {"type": "without", "string": "Tous nos derniers podcasts", "found": false}, {"type": "without", "string": "de messagerie est uniquement", "found": false}]}
{"file": "motorsport-total.com-romeo.html", "url": "https://www.motorsport-total.com/formel-1/news/nach-erstem-f1-test-2022-alfa-romeo-plant-spaeten-launch-des-c42-22020203", "text_len": 2518, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Team best\u00e4tigte am Mittwoch, dass sein neues Auto", "found": true}, {"type": "with", "string": "25. Februar auf dem Circuit de Barcelona-Catalunya", "found": true}, {"type": "with", "string": "Giovinazzi und werden versuchen", "found": true}, {"type": "without", "string": "Was kostet eine Solaranlage", "found": false}, {"type": "without", "string": "Lada Niva Monster: Russlands", "found": false}, {"type": "without", "string": "auf dem Formel-1-Auto f\u00fcr 2022", "found": false}]}
{"file": "buchperlen.wordpress.com.html", "url": "https://buchperlen.wordpress.com/2013/10/20/leandra-lou-der-etwas-andere-modeblog-jetzt-auch-zwischen-buchdeckeln/", "text_len": 3675, "tp": 2, "fn": 0, "fp": 0, "tn": 1, "details": [{"type": "with", "string": "Dann sollten Sie erst recht", "found": true}, {"type": "with", "string": "als saure G\u00fcrkchen entlarvte Ex-Boyfriends.", "found": true}, {"type": "without", "string": "US-Musiker Lou Reed", "found": false}]}
{"file": "bigdata.ypart.eu.datenerhebung.html", "url": "https://bigdata.ypart.eu/page/Digitale_Datenerhebung_und_verwertung_als_Herausforderung_f%C3%BCr_Medienbildung_und_Gesellschaft.html", "text_len": 19842, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Das vorliegende Papier wurde f\u00fcr die Gesellschaft f\u00fcr Medienp\u00e4dagogik", "found": true}, {"type": "with", "string": "F\u00fcr Nutzende digitaler Dienste ist es derzeit nahezu unm\u00f6glich zu erkennen", "found": true}, {"type": "with", "string": "Das Digitale ist zur globalen Infrastruktur geworden.", "found": true}, {"type": "without", "string": "Diese Plattform wird betrieben vom", "found": false}, {"type": "without", "string": "In Kooperation mit", "found": false}, {"type": "without", "string": "Follow us on Twitter", "found": false}]}
{"file": "archive.org-travaillent.html", "url": "https://web.archive.org/web/20070228213001/http://www.alternatives-economiques.fr/site/hs72_003_35heures.html", "text_len": 11012, "tp": 2, "fn": 1, "fp": 3, "tn": 0, "details": [{"type": "with", "string": "autres travaillent moins", "found": true}, {"type": "with", "string": "350 000 emplois cr\u00e9\u00e9s", "found": false}, {"type": "with", "string": "\u00e2ge effectif de", "found": true}, {"type": "without", "string": "Le march\u00e9 du travail est-il trop", "found": true}, {"type": "without", "string": "Hors-s\u00e9rie n\u00b0 72", "found": true}, {"type": "without", "string": "L\u2019\u00e9tat de l\u2019\u00e9conomie", "found": true}]}
{"file": "newrepublic.com.neoliberalism.html", "url": "https://newrepublic.com/article/155970/collapse-neoliberalism", "text_len": 23348, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "With the 2008 financial crash and the Great Recession", "found": true}, {"type": "with", "string": "Start with the economy. Over the course", "found": true}, {"type": "with", "string": "The central question of our time", "found": true}, {"type": "without", "string": "Ganesh Sitaraman is a professor at Vanderbilt Law School", "found": false}, {"type": "without", "string": "Read More", "found": false}, {"type": "without", "string": "Most Popular", "found": false}]}
{"file": "oekolaundbau.de-zweinutzungshuhns.html", "url": "https://oekolandbau.de/service/nachrichten/detailansicht/tag-des-zweinutzungshuhns-am-22-januar/", "text_len": 3238, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "einem echten Zweinutzungstier? Die \u00d6kotierzucht", "found": false}, {"type": "with", "string": "wurden. Hier in Deutschland", "found": true}, {"type": "with", "string": "halten inzwischen \u00d6TZ-Tiere", "found": true}, {"type": "without", "string": "Thema auf Oekolandbau.de", "found": false}, {"type": "without", "string": "Alternativen zum K\u00fckent\u00f6ten", "found": false}, {"type": "without", "string": "Foto: \u00d6TZ", "found": false}]}
{"file": "correiobraziliense.com.br-poderes.html", "url": "https://www.correiobraziliense.com.br/politica/2022/05/5005250-de-novo-em-busca-da-tregua-institucional.html", "text_len": 5788, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "do Senado, Rodrigo Pacheco (PSD-MG)", "found": true}, {"type": "with", "string": "o Supremo Tribunal Federal", "found": true}, {"type": "with", "string": "Com o mesmo repert\u00f3rio das manifesta\u00e7\u00f5es", "found": true}, {"type": "without", "string": "(cr\u00e9dito: Minervino J\u00fanior", "found": false}, {"type": "without", "string": "urg\u00eancia para barrar", "found": true}, {"type": "without", "string": "Pela Web", "found": false}]}
{"file": "toralin.de.schmierfett.html", "url": "http://www.toralin.de/schmierfett-reparierend-verschlei-y-910.html", "text_len": 1506, "tp": 3, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "Die Lebensdauer von Bauteilen erh\u00f6ht sich betr\u00e4chtlich.", "found": true}, {"type": "with", "string": "bis zu 50% Verschlei\u00df.", "found": true}, {"type": "with", "string": "Li-Seifen/Mineral\u00f6l", "found": true}, {"type": "without", "string": "Newsletter", "found": false}, {"type": "without", "string": "Wie bewerten Sie diesen Artikel?", "found": false}, {"type": "without", "string": "Meander 151", "found": false}, {"type": "without", "string": "Sie k\u00f6nnten auch an folgenden Artikeln interessiert sein", "found": false}]}
{"file": "weselpower.wordpress.com.monstergesprche.html", "url": "https://weselpower.wordpress.com/2009/12/23/monstergesprche-1/", "text_len": 122, "tp": 1, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "M:Wer rutscht als n\u00e4chstes aus auf dem Glatteis?", "found": true}, {"type": "without", "string": "Teilen Sie dies mit:", "found": false}, {"type": "without", "string": "Bloggern gef\u00e4llt das.", "found": false}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}, {"type": "without", "string": " Kommentare sind geschlossen. ", "found": false}]}
{"file": "archive.org.dzs-clan.de.html", "url": "https://web.archive.org/web/20110106023242/http://dzs-clan.de/index.php?site=news_comments&newsID=111", "text_len": 3886, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "In dieser News m\u00f6chten wir euch \u00fcber das Geschehen", "found": true}, {"type": "with", "string": "Diese Nachrichten k\u00f6nnt ihr auch auf unserer Homepage in unserer Twitter-Box lesen.", "found": true}, {"type": "with", "string": "Aller Voraussicht nach wird dieses auf der kommenden", "found": true}, {"type": "without", "string": "Hi, ihr habt das falsche Statment von mir", "found": false}, {"type": "without", "string": "sein um Kommentare zu schreiben!", "found": true}, {"type": "without", "string": "\u00a9 2010 by dzs", "found": false}]}
{"file": "tvtoday.de-willsmith.html", "url": "https://www.tvtoday.de/entertainment/kino-news/will-smith-gestoertes-verhaeltnis-zu-sohn-trey-205331.html", "text_len": 2435, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u00e4ltesten Spross im Alter von gerade", "found": true}, {"type": "with", "string": "Immer wieder posten", "found": true}, {"type": "with", "string": "hat der Familienvater", "found": true}, {"type": "without", "string": "Das k\u00f6nnte Sie auch", "found": false}, {"type": "without", "string": "Kinoprogramm-Suche", "found": false}, {"type": "without", "string": "Judy Eddy/WENN.com", "found": false}]}
{"file": "dsv.de-synchronschwimmen.html", "url": "https://www.dsv.de/synchronschwimmen/aktuelles-synchronschwimmen/lesen/?tx_ttnews%5Btt_news%5D=5793&cHash=36febeba61a32f5c94f98d8f59efb32e", "text_len": 2442, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "also, dass die filigranen Meerestiere als", "found": true}, {"type": "with", "string": "Die Kosten f\u00fcr den Levelpass belaufen", "found": true}, {"type": "with", "string": "dokumentiert. \u201eSo haben die Kinder auch etwas", "found": true}, {"type": "without", "string": "UNSERE PARTNER - SYNCHRONSCHWIMMEN", "found": false}, {"type": "without", "string": "KOMMENDE EVENTS", "found": false}, {"type": "without", "string": "TERMINE / AUSSCHREIBUNGEN", "found": false}]}
{"file": "0a29620f9c4347758c146ed06dab6f3e.html", "url": "https://www.tagblatt.ch/kultur/mit-allen-wassern-gewaschen-ld.1161246", "text_len": 3823, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Nirgends und \u00fcberall ist das Gedicht,", "found": true}, {"type": "with", "string": "Rund 75 Minuten lang sp\u00fcrt man den", "found": true}, {"type": "with", "string": "die Kunst, das Leben auf sich herabregnen zu lassen.", "found": true}, {"type": "without", "string": "Ein Kippmoment in", "found": false}, {"type": "without", "string": "Abonnemente", "found": false}, {"type": "without", "string": "Online Inserat aufgeben", "found": false}]}
{"file": "freitag.de.morgen.html", "url": "https://www.freitag.de/autoren/benjamin-immanuel-hoff/heute-schon-an-morgen-denken", "text_len": 18778, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Kommunen, die L\u00e4nder und der Bund einschneidende", "found": true}, {"type": "with", "string": "Durch die Beschr\u00e4nkungen des \u00f6ffentlichen Lebens wurde erreicht", "found": true}, {"type": "with", "string": "Kultur mit dem gemeinwirtschaftlichen Gedanken des Genossenschaftswesens verbinden", "found": true}, {"type": "without", "string": "\u00a9 der Freitag Mediengesellschaft mbH & Co. KG", "found": false}, {"type": "without", "string": "Beitrag gibt die Meinung des Autors wieder, nicht notwendigerweise die der Redaktion des Freitag.", "found": false}, {"type": "without", "string": "Beitrag handelt es sich um ein Blog aus der Freitag-Community", "found": false}]}
{"file": "public.spot-on-news.de-Traumfrau.html", "url": "https://public.spot-on-news.de/neue-traumfrau-bei-sturm-der-liebe-so-geht-es-am-fuerstenhof-weiter/", "text_len": 2713, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Und jetzt steht die 20. Staffel der Erfolgsserie", "found": true}, {"type": "with", "string": "rund um die Geschehnisse am F\u00fcrstenhof in den Startl\u00f6chern", "found": true}, {"type": "with", "string": "Wie die Macher bekannt gaben", "found": true}, {"type": "without", "string": "Mehr \u00fcber TV", "found": false}, {"type": "without", "string": "Judith Williams als Rategast im \u201eThe Masked Singer\u201c-Finale", "found": false}, {"type": "without", "string": "Lindholm zur\u00fcck in Hannover: \u201eTatort\u201c-Ende f\u00fcr das G\u00f6ttinger Team", "found": false}]}
{"file": "bondyblog.fr.paris-8.html", "url": "https://www.bondyblog.fr/societe/a-paris-8-un-peu-de-tension-beaucoup-d-actions/", "text_len": 6724, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Une gr\u00e8ve reconductible \u00e0 partir du 5 mars", "found": true}, {"type": "with", "string": "Marie-Pierre ne fait plus de cours", "found": true}, {"type": "with", "string": "Solidaires \u00c9tudiant-e-s Saint-Denis", "found": true}, {"type": "without", "string": "Candidatures ouvertes pour le Prix", "found": false}, {"type": "without", "string": "Intervenant \u00e0 l\u2019atelier", "found": false}, {"type": "without", "string": "Le piquet de gr\u00e8ve dans le hall", "found": false}]}
{"file": "gazetadopovo.com.br-pacheco.html", "url": "https://www.gazetadopovo.com.br/republica/o-que-pacheco-pretende-acenos-ao-stf-e-propor-limites-ao-indulto-presidencial/", "text_len": 14100, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "e nas faixas de manifestantes", "found": true}, {"type": "with", "string": "Esplanada dos Minist\u00e9rios como", "found": true}, {"type": "with", "string": "dos Poderes, n\u00e3o s\u00f3 com manifesta\u00e7\u00f5es", "found": true}, {"type": "without", "string": "VEJA TAMB\u00c9M:", "found": false}, {"type": "without", "string": "indulto em outras a\u00e7\u00f5es", "found": false}, {"type": "without", "string": "a batalha dos palanques em S\u00e3o Paulo", "found": true}]}
{"file": "SW1.News-Heimat.html", "url": "https://sw1.news/fussball/fussball-kreisklassen/wenn-man-in-der-heimat-verliert-dann-tuts-in-abwesendheit-vielleicht-ein-bisschen-weniger-weh/", "text_len": 1328, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Der VfB Humprechtshausen spielte", "found": true}, {"type": "with", "string": "bislang eine recht ordentliche Saison", "found": true}, {"type": "with", "string": "brachte der SG Abersfeld bisher deren einzige Niederlage bei", "found": true}, {"type": "without", "string": "Das k\u00f6nnte Dich auch interessieren:", "found": false}, {"type": "without", "string": "ANZEIGE - Heute mal ausgehen/bestellen? Wie w\u00e4re es mit:", "found": true}, {"type": "without", "string": "Wie erwartet machen die beiden Strahlunger Spielertrainer \u00fcber die Saison hinaus weiter", "found": false}]}
{"file": "polizeiticker.ch-Unfall.html", "url": "https://polizeiticker.ch/artikel/studen-be-a6-nach-toedlichem-unfall-fuer-mehrere-stunden-gesperrt-219645", "text_len": 1087, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Am Sonntag, 5. November 2023, kurz nach 21.25 Uhr", "found": true}, {"type": "with", "string": "wurde der Kantonspolizei Bern auf der A6 bei Studen ein schwerer Verkehrsunfall gemeldet", "found": true}, {"type": "with", "string": "Aus ungekl\u00e4rten Gr\u00fcnden fuhr ein Autolenker im Bereich der Ausfahrt", "found": true}, {"type": "without", "string": "KANTONS-SUDOKU", "found": false}, {"type": "without", "string": "KANTONS\u00dcBERSICHT", "found": false}, {"type": "without", "string": "FAHNDUNGEN", "found": false}]}
{"file": "mein-schoener-garten.de-topinabur.html", "url": "https://www.mein-schoener-garten.de/news/3-profi-tipps-rund-um-die-topinambur-ernte-48412", "text_len": 3840, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Winter Gem\u00fcse frisch aus dem Garten", "found": true}, {"type": "with", "string": "Pflanze sind nahrhaft, ballaststoffreich und", "found": true}, {"type": "with", "string": "Der Boden ist gefroren. Dagegen hilft", "found": true}, {"type": "without", "string": "Empfehlungen aus dem", "found": false}, {"type": "without", "string": "Verwandte Artikel", "found": false}, {"type": "without", "string": "R\u00fcben: Sch\u00e4tze aus dem Untergrund", "found": false}]}
{"file": "moritz-meyer.net.vreni.html", "url": "https://moritz-meyer.net/blog/vreni-frost-instagram-abmahnung/", "text_len": 21087, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Das ist alles nicht gekennzeichnet, wie soll ich wissen", "found": true}, {"type": "with", "string": "Instagramshops machen es Abmahnanw\u00e4lten leicht", "found": true}, {"type": "with", "string": "Ich bin der Ansicht, abwarten und Tee trinken.", "found": false}, {"type": "without", "string": "Diese Geschichte teilen", "found": false}, {"type": "without", "string": "Diese Website verwendet Akismet, um Spam zu reduzieren.", "found": false}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}]}
{"file": "d041d20a0bc04fdf8cef73f750f20bf6.html", "url": "https://www.gamestar.de/videos/der-landwirtschafts-simulator-19-wird-ein-jahr-nach-release-groesser-trailer-stellt-platinum-edition-vor,99770.html", "text_len": 936, "tp": 2, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "auf Windows PCs, Mac, Xbox One und PS4. Der Trailer gibt euch einen kurzen \u00dcberblick zu den zus\u00e4tzlichen Inhalten.", "found": true}, {"type": "with", "string": "als eigenst\u00e4ndiges Spiel und wird zudem", "found": true}, {"type": "without", "string": "Kommentare", "found": false}, {"type": "without", "string": "alle anzeigen", "found": false}, {"type": "without", "string": "Nur angemeldete Benutzer k\u00f6nnen kommentieren und bewerten.", "found": false}, {"type": "without", "string": "Steam", "found": false}]}
{"file": "fincompare.de.firmenwagen.html", "url": "https://fincompare.de/firmenwagen-leasing-oder-finanzierung", "text_len": 9350, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "In diesem Artikel stellen wir die wichtigsten Punkte und vor allem die steuerlichen Aspekte", "found": true}, {"type": "with", "string": "ist die H\u00f6he der Monatsraten dementsprechend niedriger als beim Kilometerleasing.", "found": true}, {"type": "with", "string": "Kann nicht steuerlich geltend gemacht werden", "found": true}, {"type": "without", "string": "Umsatzsteuererstattung bei Leasing und Mietkauf?", "found": false}, {"type": "without", "string": "Nutzen Sie FinCompare als Wettbewerbsvorteil", "found": true}, {"type": "without", "string": "vielf\u00e4ltige Suchoptionen, Transparenz, \u00dcbersichtlichkeit", "found": false}]}
{"file": "omeda.de-paxlovid.html", "url": "https://www.onmeda.de/krankheiten/coronavirus/paxlovid-id212627/", "text_len": 6431, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "durch das Coronavirus. Erfahren Sie", "found": true}, {"type": "with", "string": "Pr\u00e4parat namens Molnupiravir brachte", "found": true}, {"type": "with", "string": "Menschen mit einem erh\u00f6hten Risiko", "found": true}, {"type": "without", "string": "Dieser Text entspricht den", "found": true}, {"type": "without", "string": "Covid-19 oder Grippe?", "found": false}, {"type": "without", "string": "Tsch\u00fcss, Bauchfett! Hilfe", "found": false}]}
{"file": "ebike-mtb.com-OFFROAD.html", "url": "https://ebike-mtb.com/advanced-offroad-pro-race-mtb-fs-test/", "text_len": 10020, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ihr habt von der deutschen E-Bike-Brand Advanced noch nie etwas geh\u00f6rt?", "found": true}, {"type": "with", "string": "Macht nix, wir kl\u00e4ren euch auf.", "found": true}, {"type": "with", "string": "Im City- und Trekking-Bereich ist Advanced bereits gut etabliert.", "found": true}, {"type": "without", "string": "Der Artikel gef\u00e4llt dir?", "found": false}, {"type": "without", "string": "Melde dich f\u00fcr unseren Newsletter an!", "found": false}, {"type": "without", "string": "Empfohlen f\u00fcr dich", "found": false}]}
{"file": "einfachspanien.de.malaga.html", "url": "http://www.einfachspanien.de/malaga-die-quirlige-metropole-in-andalusien.html", "text_len": 1931, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Spanien hat als Reiseland", "found": true}, {"type": "with", "string": "Wer Malaga nicht nur", "found": true}, {"type": "with", "string": "Einfluss auf die Freundlichkeit", "found": true}, {"type": "without", "string": "Keine Kommentare for", "found": false}, {"type": "without", "string": "Wussten Sie schon...?", "found": false}, {"type": "without", "string": "Warning: Creating default object", "found": false}]}
{"file": "fluter.de.vorbild.html", "url": "https://www.fluter.de/corona-big-data-suedkorea-vorbild-fuer-deutschland", "text_len": 7624, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Felix Stalder: Zu wissen, mit wem Corona-Patienten", "found": true}, {"type": "with", "string": "gleichzeitig Dutzende, vielleicht sogar Hunderte Nutzer eingew\u00e4hlt.", "found": true}, {"type": "with", "string": "m\u00f6glich zu machen. In jedem Fall bricht eine ander", "found": true}, {"type": "without", "string": "Titelbild:", "found": true}, {"type": "without", "string": "Auch interessant", "found": false}, {"type": "without", "string": "Dieser Text wurde ver\u00f6ffentlicht", "found": false}]}
{"file": "djz.de-amoklauf.html", "url": "https://djz.de/amoklauf-in-heidelberg-rufe-nach-schneller-aufklaerung/", "text_len": 1721, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "einer Meldung von heute.", "found": true}, {"type": "with", "string": "FWR fordere eine schnelle und umfassende", "found": true}, {"type": "with", "string": "und Europa verhindern.", "found": true}, {"type": "without", "string": "DJV-Verbandsbericht ver\u00f6ffentlicht", "found": false}, {"type": "without", "string": "Vorheriger Artikel", "found": false}, {"type": "without", "string": "Immer mehr Wildschweine in K\u00f6ln", "found": false}]}
{"file": "humanresourcesmanager.de.diversity.html", "url": "https://www.humanresourcesmanager.de/future-of-work/gender-diversity-revolution-im-reallabor-women-digit-praxislaboratorien-atruvia/", "text_len": 6343, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Bulgarien hat uns einiges voraus,", "found": true}, {"type": "with", "string": "In Praxislabs die Zukunft", "found": true}, {"type": "with", "string": "Agilit\u00e4t wirkt.", "found": true}, {"type": "without", "string": "Weitere Beitr\u00e4ge aus der Kolumne:", "found": true}, {"type": "without", "string": "Unser Newsletter", "found": false}, {"type": "without", "string": "Verwandte Artikel", "found": false}]}
{"file": "archive.org.welpenkaufen24.de.html", "url": "https://web.archive.org/web/20160401095740/http://www.welpenkaufen24.de/", "text_len": 1049, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "dass Bekannte bei unseri\u00f6sen Z\u00fcchtern", "found": true}, {"type": "with", "string": "Beschimpfungen akzeptiere ich aber nicht unter den Kommentaren.", "found": true}, {"type": "with", "string": "m\u00f6chte ich in diesem Blog den ein oder", "found": true}, {"type": "without", "string": "Hunderassen", "found": true}, {"type": "without", "string": "Welcher Hund passt zu mir?", "found": false}, {"type": "without", "string": "Erforderliche Felder sind markiert", "found": false}]}
{"file": "Osthessen-news.de-Buergermeisterwahl.html", "url": "https://osthessen-news.de/n11752374/claudia-brandes-und-ihr-links-gruenes-buendnis-muessen-jetzt-liefern.html", "text_len": 2145, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Zun\u00e4chst ist festzustellen", "found": true}, {"type": "with", "string": "dass die CDU in Petersberg und ihr B\u00fcrgermeister", "found": true}, {"type": "with", "string": "in den vergangenen sechs Jahren nicht unbedingt einen harmonischen Eindruck hinterlassen haben", "found": true}, {"type": "without", "string": "DEIN HEIMATPODCAST", "found": false}, {"type": "without", "string": "Petersberg B\u00fcrgermeisterwahl - weitere Artikel", "found": false}, {"type": "without", "string": "DEN RICHTIGEN FINDEN", "found": false}]}
{"file": "frolleinherr.com.lost.html", "url": "https://frolleinherr.com/thoughts/kolumne-lost-aber-immer-noch-da/ ", "text_len": 13509, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Einige sehr aufmerksame", "found": true}, {"type": "with", "string": "Es ist so: Mein", "found": true}, {"type": "with", "string": "An dieser Stelle sei gesagt:", "found": true}, {"type": "without", "string": "11 Antworten zu", "found": true}, {"type": "without", "string": "Impressum", "found": false}, {"type": "without", "string": "Schon gelesen?", "found": false}]}
{"file": "strafprozess.ch.polizisten.html", "url": "https://www.strafprozess.ch/rasende-polizisten/", "text_len": 405, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Auch Polizisten im Dienst", "found": true}, {"type": "with", "string": "Das Bundesgericht kassiert", "found": true}, {"type": "with", "string": "signalisierte H\u00f6chstgeschwindigkeit", "found": true}, {"type": "without", "string": "Ege/Heimgartner/Niggli (Hrsg.)", "found": false}, {"type": "without", "string": "Drucken etc.", "found": false}, {"type": "without", "string": "10. Dreil\u00e4nderforum in Bregenz", "found": false}]}
{"file": "anchor.ch.lanka.html", "url": "https://www.anchor.ch/gesellschaft/ein-tag-aus-dem-leben-eines-taugenichts-oder-die-leute-von-sri-lanka/", "text_len": 19405, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Es ist sechs Uhr fr\u00fch und noch stockdunkel", "found": true}, {"type": "with", "string": "f\u00fchren diese improvisierten T\u00fcten aus Sch\u00fclernotizen.", "found": true}, {"type": "with", "string": "Kumara kennt mich recht gut", "found": true}, {"type": "without", "string": "Deine E-Mail-Adresse wird nicht ver\u00f6ffentlicht", "found": false}, {"type": "without", "string": "Blog via E-Mail abonnieren", "found": false}, {"type": "without", "string": "Peter Addor ist Mathematiker, Systemdenke", "found": false}]}
{"file": "klaenge-des-verschweigens.de.geschichte.html", "url": "http://www.klaenge-des-verschweigens.de/film/geschichte/", "text_len": 2505, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Das \u201eschwarze Schaf\u201c unserer Familie", "found": true}, {"type": "with", "string": "Durch das Aufbl\u00e4ttern eines Familiengeheimnisses", "found": true}, {"type": "with", "string": "Wobei Musik fundamental beteiligt wird", "found": true}, {"type": "without", "string": "Unterst\u00fctze das Projekt:", "found": false}, {"type": "without", "string": "Ein detektivisches Dokumentarprojekt", "found": false}, {"type": "without", "string": "Gef\u00f6rdert durch:", "found": false}]}
{"file": "automobilwoche.de-VW-Betriebsversammlung.html", "url": "https://www.automobilwoche.de/article/20211103/AGENTURMELDUNGEN/311039909/1276/krach-vor-der-vw-betriebsversammlung-es-knirscht-zwischen-diess-und-aufsichtsraeten", "text_len": 2289, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "bei VW mehren sich", "found": false}, {"type": "with", "string": "VW-Chef Herbert Diess:", "found": false}, {"type": "with", "string": "Haussegen h\u00e4ngt schief", "found": true}, {"type": "without", "string": "Starker R\u00fcckgang im Oktober:", "found": false}, {"type": "without", "string": "Die neuesten Aufzeichnungen", "found": false}, {"type": "without", "string": "Jobs in der Autobranche", "found": false}]}
{"file": "digitalcourage.de-Muendigkeit.html", "url": "https://digitalcourage.de/blog/2023/buch-digitale-muendigkeit", "text_len": 6502, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Haben auch Sie den Eindruck", "found": true}, {"type": "with", "string": "dass unsere Welt gerade aus den Fugen ger\u00e4t", "found": true}, {"type": "with", "string": "Unser achtloser Umgang mit digitalen Medien", "found": true}, {"type": "without", "string": "Buch bestellen", "found": false}, {"type": "without", "string": "Ist Ihnen beim Betreten dieser Seite etwas aufgefallen?", "found": false}, {"type": "without", "string": "Wir haben Sie nicht mit einer Cookieabfrage genervt.", "found": false}]}
{"file": "industriemagazin.at-Luftfahrtbranche.html", "url": "https://industriemagazin.at/news/luftfahrtbranche-hebt-nach-corona-ab-und-facc-profitiert/", "text_len": 4656, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In der Luftfahrt geht es nach der Pandemie wieder rasant bergauf.", "found": true}, {"type": "with", "string": "Davon ist auch der ober\u00f6sterreichische Luftfahrtzulieferer FACC deutlich betroffen.", "found": true}, {"type": "with", "string": "Wir haben einen gewaltigen Auftragseingang", "found": true}, {"type": "without", "string": "Entdecken Sie jetzt", "found": false}, {"type": "without", "string": "Sie wollen mehr von uns?", "found": false}, {"type": "without", "string": "Weitere interessante Artikel", "found": false}]}
{"file": "blogoff.de.i-htm.html", "url": "https://blogoff.de/2015/11/12/i-htm/", "text_len": 688, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In Berlin lebe ich nun", "found": true}, {"type": "with", "string": "Vielen Dank an die S-Bahn", "found": true}, {"type": "with", "string": "Base Flying", "found": true}, {"type": "without", "string": "I \u2665 BLOG OFF!", "found": false}, {"type": "without", "string": "Was passiert hier eigentlich noch?", "found": false}, {"type": "without", "string": "powdered by wordpress", "found": false}]}
{"file": "wired.com.burn.html", "url": "https://www.wired.com/story/ai-great-things-burn-planet/", "text_len": 4168, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Last month, researchers at OpenAI in San Francisco revealed", "found": true}, {"type": "with", "string": "As more companies across more industries begin", "found": true}, {"type": "with", "string": "including the energy needed to build it", "found": true}, {"type": "without", "string": "One algorithm that lets a robot manipulate a Rubik", "found": false}, {"type": "without", "string": "The latest on artificial intelligence, from machine learning to computer vision and more", "found": false}, {"type": "without", "string": "writer for WIRED, covering artificial intelligence", "found": false}]}
{"file": "winfuture.de-NASA.html", "url": "https://winfuture.de/news,139377.html", "text_len": 3655, "tp": 3, "fn": 0, "fp": 3, "tn": 0, "details": [{"type": "with", "string": "Wir starten mehr als Raketen", "found": true}, {"type": "with", "string": "Der Start der Plattform ist Bestandteil einer weitgehenden \u00dcberarbeitung", "found": true}, {"type": "with", "string": "der digitalen Plattformen, die die NASA im Sommer angek\u00fcndigt hatte", "found": true}, {"type": "without", "string": "Neue NASA-Fotos", "found": true}, {"type": "without", "string": "Videos zum Thema", "found": true}, {"type": "without", "string": "Beitr\u00e4ge aus dem Forum", "found": true}]}
{"file": "psl.eu.luniversite.html", "url": "https://www.psl.eu/actualites/luniversite-psl-quand-les-grandes-ecoles-font-universite", "text_len": 4165, "tp": 2, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Le d\u00e9cret n\u00b02019-1130 validant", "found": true}, {"type": "with", "string": "restructurant \u00e0 cet effet \u00bb.", "found": true}, {"type": "without", "string": " utilise des cookies pour", "found": false}, {"type": "without", "string": "En savoir plus", "found": false}, {"type": "without", "string": "CNRS, Inserm, Inria.", "found": true}]}
{"file": "hertha-blog.de.dame.html", "url": "http://www.hertha-blog.de/der-lange-und-die-alte-dame.html", "text_len": 5574, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In diesem Sommer war Michael Preetz", "found": true}, {"type": "with", "string": "Zeit als Spieler noch", "found": true}, {"type": "with", "string": "die Entscheidung f\u00fcr Dardai", "found": true}, {"type": "without", "string": "Drei Berliner kommentieren ihre Erlebniss", "found": false}, {"type": "without", "string": "\u201cHertha? Ist das dein Ernst?\u201d", "found": false}, {"type": "without", "string": "Beliebte Beitr\u00e4ge zum Thema:", "found": false}]}
{"file": "fifplay.com.settings.html", "url": "https://www.fifplay.com/fifa-21-game-settings/", "text_len": 9957, "tp": 4, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "You are able to customise and adjust the settings", "found": true}, {"type": "with", "string": "Your Default Game Lanaguage", "found": true}, {"type": "with", "string": "By setting this to Default, attributes are", "found": true}, {"type": "with", "string": "CPU GAMEPLAY CUSTOMISATION", "found": true}, {"type": "without", "string": "FIFA 21 Camera Settings", "found": false}, {"type": "without", "string": "Post Your Comments", "found": false}, {"type": "without", "string": "Shortcuts", "found": false}]}
{"file": "duengebehoerde-niedersachsen.de-Sperrfristen.html", "url": "https://www.duengebehoerde-niedersachsen.de/duengebehoerde/news/38853_Sperrfristende_01._Februar_-_Rechtliche_Hinweise_zur_N-D%C3%BCngung", "text_len": 10550, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "und damit auch mit Wirtschaftsd\u00fcnger", "found": true}, {"type": "with", "string": ". Die Regelung gilt f\u00fcr Gr\u00fcnland und", "found": true}, {"type": "with", "string": "Aufgrund EU-Vorgaben wurde die Auslegung", "found": true}, {"type": "without", "string": "\u00fcberschwemmte B\u00f6den: D\u00fcngung verboten", "found": false}, {"type": "without", "string": "Mehr zum Thema", "found": false}, {"type": "without", "string": "Frost: Der Boden muss am Tag des Aufbringens v\u00f6llig", "found": false}]}
{"file": "ingenieur.de.kernfusion.html", "url": "https://www.ingenieur.de/technik/fachbereiche/energie/kernfusion-kann-die-energiequelle-der-sterne-energieprobleme-aus-der-welt-schaffen/", "text_len": 5762, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u00dcberall auf der Welt forscht man", "found": true}, {"type": "with", "string": "Das NIF-Team hat", "found": true}, {"type": "with", "string": "Kleiner Schritt zu einer gr\u00fcnen Energiequelle", "found": true}, {"type": "without", "string": "THEMEN IM ARTIKEL", "found": false}, {"type": "without", "string": "TOP 5 ENERGIE", "found": false}, {"type": "without", "string": "12.12.2022, 08:30 Uhr", "found": false}]}
{"file": "reporternewspapers.net-Brookhaven.html", "url": "https://roughdraftatlanta.com/2023/11/08/brookhaven-village-closed-due-to-gas-leak/", "text_len": 679, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Brookhaven Police Department is reporting", "found": false}, {"type": "with", "string": "a construction company struck another gas line in the area of Dresden Drive", "found": false}, {"type": "with", "string": "near Parkside Drive. Road closure signs have been placed to shut the roadway down.", "found": false}, {"type": "without", "string": "TRENDING ON ROUGH DRAFT", "found": false}, {"type": "without", "string": "RECENT STORIES", "found": false}, {"type": "without", "string": "PROUDLY POWERED BY NEWSPACK BY AUTOMATTIC", "found": false}]}
{"file": "it-for-kids.org.variables.html", "url": "https://it-for-kids.org/blog/191211_variables/", "text_len": 205, "tp": 3, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Wie war das nochmal mit den Variablen", "found": true}, {"type": "with", "string": "Variablen sind kein Problem f\u00fcr dich?", "found": true}, {"type": "with", "string": "Auszug aus unseren Lehrmaterialien", "found": true}, {"type": "without", "string": "Copyright \u00a9 2020 IT4Kids", "found": false}, {"type": "without", "string": "Impressum", "found": false}]}
{"file": "seglerblog.st\u00f6ssenseer.de.sauber.html", "url": "https://seglerblog.st\u00f6ssenseer.de/haltet-unsere-gewaesser-sauber/", "text_len": 403, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Der Plakatwettbewerb f\u00fcr Kinder", "found": true}, {"type": "with", "string": "Gestalte ein Plakat unter dem", "found": true}, {"type": "with", "string": "an die Berliner*innen", "found": false}, {"type": "without", "string": "Finde im SeglerBlog!", "found": false}, {"type": "without", "string": "Verwandte Beitr\u00e4ge", "found": false}, {"type": "without", "string": "Schreibe einen Kommentar", "found": false}]}
{"file": "mdavis.xyz.supermarket.html", "url": "https://www.mdavis.xyz/supermarket/", "text_len": 8135, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "The cameras recognise me as soon as I", "found": true}, {"type": "with", "string": "afternoon snack on way home from work", "found": true}, {"type": "with", "string": " FoodCorp to feed ourselves, FoodCorp feeds on us", "found": true}, {"type": "without", "string": "11 Jan 2019", "found": false}, {"type": "without", "string": "Photo by ev on Unsplash", "found": false}, {"type": "without", "string": "find more by Matthew Davis", "found": false}]}
{"file": "jaegermagazin.de-s\u00fcdtirol.html", "url": "https://www.jaegermagazin.de/jagd-aktuell/news-fuer-jaeger/suedtirol-woelfe-toeten-hund-und-bedrohen-besitzer/", "text_len": 2087, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Woche ereignete sich in S\u00fcdtirol eine", "found": true}, {"type": "with", "string": "Folgaria gemacht haben. Der", "found": true}, {"type": "with", "string": "Als sich die W\u00f6lfe immer noch", "found": true}, {"type": "without", "string": "Hundemeute oder Soloj\u00e4ger?", "found": false}, {"type": "without", "string": "Nutria bejagen und verwerten", "found": false}, {"type": "without", "string": "Neuentdeckung: Die wahren", "found": false}]}
{"file": "skispringen.com-verpasst.html", "url": "https://www.skispringen.com/marita-kramer-verpasst-olympische-spiele-in-peking/", "text_len": 2727, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Spiele in Peking werden ohne die gro\u00dfe Top", "found": true}, {"type": "with", "string": "Ich habe so viel Energieund Zeit investiert", "found": true}, {"type": "with", "string": "die Einzel-Entscheidung auf", "found": true}, {"type": "without", "string": "\u00dcber Luis Holuch", "found": false}, {"type": "without", "string": "Ryoyu Kobayashi gewinnt die 70.", "found": false}, {"type": "without", "string": "NATIONENCUP 2021/2022", "found": false}]}
{"file": "peta.de-veterin\u00e4r\u00e4mter.html", "url": "https://www.peta.de/neuigkeiten/veterinaeraemter-2021/", "text_len": 12096, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "f\u00fcr die \u00dcberwachung und den", "found": true}, {"type": "with", "string": "immer die gesamte Beh\u00f6rde", "found": true}, {"type": "with", "string": "Unterschreiben Sie unsere Petition", "found": true}, {"type": "without", "string": "1. Kreisveterin\u00e4ramt", "found": true}, {"type": "without", "string": "VERWANDTE ARTIKEL", "found": false}, {"type": "without", "string": "Alle Blogbeitr\u00e4ge zu unseren", "found": false}]}
{"file": "bewusster-leben.de.hope.html", "url": "https://www.bewusster-leben.de/hope/", "text_len": 4042, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ein grauer Wintermorgen ", "found": true}, {"type": "with", "string": "Dem Wunder die Hand reichen", "found": true}, {"type": "with", "string": "In ihrem Buch \u201eKrafttiere", "found": true}, {"type": "without", "string": "Diesen Artikel teilen", "found": false}, {"type": "without", "string": "Weitere Beitr\u00e4ge", "found": false}, {"type": "without", "string": "Startseite", "found": false}]}
{"file": "0a962f6bcd5649f7a7e6effa338df80d.html", "url": "https://neunzehn72.de/imac-5k-lightroom-performance-geloest-danke-an-die-community/", "text_len": 1005, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Ich freue mich wie ein kleines Kind.", "found": true}, {"type": "with", "string": "Jetzt rennt der iMac Pro wie Hulle", "found": true}, {"type": "with", "string": "Aufl\u00f6sung der 5K-Displays", "found": true}, {"type": "without", "string": "Ich mag jede Art von Fotografie", "found": true}, {"type": "without", "string": "Leave a Comment! ", "found": false}, {"type": "without", "string": "Ja, ich m\u00f6chte den w\u00f6chentlichen Newsletter bekommen", "found": false}]}
{"file": "courgage-online.de.HIV.html", "url": "https://www.courage-online.de/erfinderinnen-ann-kiessling-und-ihre-forschung-im-kampf-gegen-das-hiv-virus/", "text_len": 3187, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ann Kiessling hat viele wichtige", "found": true}, {"type": "with", "string": "Tausende von Texten zum Thema", "found": true}, {"type": "with", "string": "IVF vor \u00fcber", "found": true}, {"type": "without", "string": "Dir hat der Artikel gefallen? Jetzt teilen...", "found": false}, {"type": "without", "string": "Das eigene Limit infrage stellen", "found": false}, {"type": "without", "string": "Noch mehr Infos f\u00fcr dich", "found": false}]}
{"file": "heavenlynnhealthy.de.mareenburk.html", "url": "https://heavenlynnhealthy.de/lieblingslabel-faire-swimwear-von-mymarini-interview-mit-gruenderin-mareen-burk/", "text_len": 9757, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Dies ist vielleicht ein Food Blog, ", "found": true}, {"type": "with", "string": "Meine Gr\u00fcndergeschichte", "found": true}, {"type": "with", "string": "Wir bei MYMARINI gehen von daher aus einer", "found": true}, {"type": "without", "string": "Kategorie:", "found": false}, {"type": "without", "string": "Folge mir", "found": false}, {"type": "without", "string": "Hallo!", "found": false}]}
{"file": "Journalistenwatch.com-Ladensterben.html", "url": "https://journalistenwatch.com/2023/11/01/ladensterben-immer-dramatischer/", "text_len": 4058, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Der Handelsverband Deutschland (HDE)", "found": true}, {"type": "with", "string": "rechnet jetzt auch noch mit einem beschleunigten Ladensterben", "found": true}, {"type": "with", "string": "Ein Drittel der Mittelst\u00e4ndler will sein Gesch\u00e4ft lieber morgen als \u00fcbermorgen aufgeben", "found": true}, {"type": "without", "string": "Sch\u00fctzt Annalena Baerbock weiterhin iranische Terrorbanden?", "found": false}, {"type": "without", "string": "Das ist die Totenglocke dieser Regierung!", "found": false}, {"type": "without", "string": "Hupkonzerte und Rufe der Demonstranten in den Innenst\u00e4dten", "found": false}]}
{"file": "aktion-hummelschutz.de.hummeln.html", "url": "https://aktion-hummelschutz.de/biologie/tote-hummeln-unter-linden/", "text_len": 8551, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Normalerweise leben Hummeln", "found": true}, {"type": "with", "string": "Das Sterben tritt zur Bl\u00fctezeit", "found": true}, {"type": "with", "string": "Baal T, Denke B, M\u00fchlen", "found": true}, {"type": "without", "string": "War der Artikel n\u00fctzlich?", "found": false}, {"type": "without", "string": "Holen Sie sich meinen", "found": false}, {"type": "without", "string": "M\u00f6chten Sie den Artikel teilen?", "found": false}]}
{"file": "singapur-reiseinfo.de.abc.html", "url": "http://www.singapur-reiseinfo.de/Reise-ABC/reise-abc.html", "text_len": 17281, "tp": 3, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Reiseinformationen durch das", "found": true}, {"type": "with", "string": "Einfuhrverbot: Waffen. Munition", "found": true}, {"type": "with", "string": "SARS kann bei Wiederauftreten", "found": true}, {"type": "without", "string": "\u00dcber 45.000 Ferienh\u00e4user", "found": false}, {"type": "without", "string": "Die folgenden Hotel Links", "found": false}]}
{"file": "vogelwarte.ch-aktionsplan.html", "url": "https://www.vogelwarte.ch/de/vogelwarte/news/avinews/dezember-2021/zielartenfoerderung-im-lichten-wald-dank-aktionsplan", "text_len": 3574, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "mikroklimatische Bedingungen in der Strauch", "found": true}, {"type": "with", "string": "BAFU, einen Aktionsplan \u00abZielartenf\u00f6rderung", "found": true}, {"type": "with", "string": " Lebensraumf\u00f6rderung mit der spezifischen Artenf\u00f6rderung", "found": true}, {"type": "without", "string": "und der Hirschk\u00e4fer (Lucanus cervus)", "found": false}, {"type": "without", "string": "beinhaltet auch die lichten W\u00e4lder, welche", "found": false}, {"type": "without", "string": "Kastanienselven beispielsweise", "found": false}]}
{"file": "pferderevue.at-\u00fcbung.html", "url": "https://www.pferderevue.at/aktuelles/ausbildung/2022/schluss-mit-poltern--vier-uebungen-fuer-einen-geschmeidigen-sitz.html", "text_len": 14483, "tp": 2, "fn": 1, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "poltert\u2019s bei Ihnen beim Aussitzen?", "found": false}, {"type": "with", "string": "Pferde selbst in den schwierigsten", "found": true}, {"type": "with", "string": "Kursen im In- und Ausland gemacht hat. Dieses", "found": true}, {"type": "without", "string": "Gro\u00dfe Beckenkreise (links) stabiliseren,", "found": false}, {"type": "without", "string": "Bei der Beckenkippung nach hinten sinkt der Brustkorb ein", "found": false}, {"type": "without", "string": "Das Buch & der Online-Lehrgang zum", "found": true}]}
{"file": "enwb.com.windpark.steinheim.html", "url": "https://www.enbw.com/unternehmen/presse/buergerbeteiligung-fuer-den-windpark-steinheim-startet.html", "text_len": 2049, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Steinheim, Nordrhein-Westfalen/Stuttgart", "found": true}, {"type": "with", "string": "Mit der B\u00fcrgerbeteiligung", "found": true}, {"type": "with", "string": "\u00dcber die digitale", "found": true}, {"type": "without", "string": "Die EnBW Energie Baden-W\u00fcrttemberg AG ist:", "found": false}, {"type": "without", "string": "Das k\u00f6nnte Sie auch interessieren", "found": false}, {"type": "without", "string": "Zur\u00fcck zum Newsroom", "found": false}]}
{"file": "bibliothek2null.de.mai.html", "url": "http://www.bibliothek2null.de/2014/05/18/alles-neue-mach-der-mai/", "text_len": 1141, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Nachdem ich mein Blog", "found": true}, {"type": "with", "string": "Der Anfang ist gemacht", "found": true}, {"type": "with", "string": "Ich hoffe euch gef\u00e4llt der Relaunch.", "found": true}, {"type": "without", "string": "Deine E-Mail-Adresse wird", "found": false}, {"type": "without", "string": "bei Informationspraxis- ein neues", "found": false}, {"type": "without", "string": "Permalink", "found": false}]}
{"file": "campino2k.de.uberspace.html", "url": "https://campino2k.de/2016/02/28/uberspace-und-lets-encrypt/", "text_len": 1089, "tp": 3, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Nachdem bei Uberspace jetzt", "found": true}, {"type": "with", "string": "Die Anpassung der entsprechenden", "found": true}, {"type": "with", "string": "bei Projekten mit WordPress", "found": true}, {"type": "without", "string": "Hier schreibt Christian", "found": false}, {"type": "without", "string": "Das k\u00f6nnte Sie auch interessieren", "found": false}]}
{"file": "geburtstagsecke.de.ideen.html", "url": "https://www.geburtstagsecke.de/ideen", "text_len": 2257, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die richtigen Ideen f\u00fcr den", "found": true}, {"type": "with", "string": "Daher ist es sinnvoll das Kind in die Planung", "found": true}, {"type": "with", "string": "Ihr solltet aber auf jeden Fall", "found": true}, {"type": "without", "string": "\u00a9 2019 geburtstagsecke.de", "found": false}, {"type": "without", "string": "Geburtstage f\u00fcr Erwachsene planen und feiern", "found": false}, {"type": "without", "string": "Beliebte Tags", "found": false}]}
{"file": "edition.cnn.com-royal.html", "url": "https://edition.cnn.com/2021/03/08/uk/meghan-harry-oprah-interview-recap-scli-gbr-intl/index.html", "text_len": 14159, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "The duchess has hinted", "found": true}, {"type": "with", "string": "broach the topic", "found": true}, {"type": "with", "string": "Harry also criticized", "found": true}, {"type": "without", "string": "baby's skin color", "found": false}, {"type": "without", "string": "PAID CONTENT", "found": false}, {"type": "without", "string": "Berlin: Eine Senior-Dating", "found": false}]}
{"file": "impulse.de.eltern.html", "url": "https://www.impulse.de/recht-steuern/rechtsratgeber/kind-krank/7297147.html", "text_len": 10914, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wie viele Tage im Jahr d\u00fcrfen Mitarbeiter", "found": false}, {"type": "with", "string": "Gibt es dabei eine Altersgrenze f\u00fcr die Kinder?", "found": true}, {"type": "with", "string": "Man kann den Anspruch auf Kinderkrankentage", "found": true}, {"type": "without", "string": "TERMINE F\u00dcR UNTERNEHMER", "found": false}, {"type": "without", "string": "2023 nichts mehr vers\u00e4umen!", "found": false}, {"type": "without", "string": "Das k\u00f6nnte Sie auch interessieren", "found": false}]}
{"file": "publishedreporter.com-Hottest.html", "url": "https://www.publishedreporter.com/2023/11/08/scientists-confirm-2023-as-hottest-year-ever-in-the-making/", "text_len": 2772, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "From the Copernicus Climate Change Service", "found": true}, {"type": "with", "string": "Samantha Burgess confirms with high certainty", "found": true}, {"type": "with", "string": "that the global temperature has surpassed pre-industrial averages", "found": true}, {"type": "without", "string": "Advertising Disclosure", "found": false}, {"type": "without", "string": "This site participates in the Amazon Associate program", "found": false}, {"type": "without", "string": "and earns revenue from qualifying purchases", "found": false}]}
{"file": "chocolate.com.pregnant.html", "url": "https://www.chocolate.com/view/woman-sees-a-car-stop-for-pregnant-beggar-this-is-what-she-finds-when-she-follows/&page=2", "text_len": 427, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Could it be true? Was she trying", "found": true}, {"type": "with", "string": "working to catch those who run operations", "found": false}, {"type": "with", "string": "she was lucky enough to receive a", "found": false}, {"type": "without", "string": "CHOCOLATE.COM2020", "found": false}, {"type": "without", "string": "Terms Of Service", "found": false}, {"type": "without", "string": "DMCA", "found": false}]}
{"file": "houzz.de-Projekte.html", "url": "https://www.houzz.de/magazin/best-of-houzz-2022-das-sind-die-beliebtesten-projekte-auf-houzz-stsetivw-vs~157401545", "text_len": 7249, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Projekte, die bei den Millionen", "found": true}, {"type": "with", "string": "zu den Projekten, die", "found": true}, {"type": "with", "string": "Ausz\u00fcgen hat es der Community", "found": true}, {"type": "without", "string": "Verraten Sie gerne in den Kommentaren:", "found": true}, {"type": "without", "string": "\u00c4hnliche Artikel lesen", "found": false}, {"type": "without", "string": "Nutzer mochten auch folgende", "found": false}]}
{"file": "nwx.new-work.se.digitaler-stress.html", "url": "https://nwx.new-work.se/themenwelten/gesellschaft/umfrage-zur-digitalisierung-am-arbeitsplatz-mitbestimmung-und-vertrauen-reduziert-digitalen-stress", "text_len": 4030, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Die Potenziale der Digitalisierung", "found": true}, {"type": "with", "string": "\u201eCorona hatte einen regelrechten", "found": true}, {"type": "with", "string": "*Mit der repr\u00e4sentativen Befragung", "found": true}, {"type": "without", "string": "Weitere aktuelle Themen aus der Arbeitswelt", "found": true}, {"type": "without", "string": "Schwerpunkte", "found": false}, {"type": "without", "string": "Magazin", "found": false}]}
{"file": "gruen-digital.de.jahrestagung.html", "url": "https://www.gruen-digital.de/2015/01/digitalpolitisches-jahrestagung-2015-der-heinrich-boell-stiftung-baden-wuerttemberg/", "text_len": 5002, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Prof. Dr. Caja Thimm", "found": true}, {"type": "with", "string": "zur Anmeldung.", "found": true}, {"type": "without", "string": "Next post", "found": false}, {"type": "without", "string": "Aus den L\u00e4ndern", "found": false}]}
{"file": "pamelaandersonfoundation.org.yellow.html", "url": "https://www.pamelaandersonfoundation.org/news/2018/12/4/yellow-vests-and-i", "text_len": 5342, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "I am glad that the media", "found": true}, {"type": "with", "string": "Lots of media see Yellow Vests", "found": true}, {"type": "with", "string": "Moralising about burned", "found": true}, {"type": "without", "string": "John Bitove, Chair Priszm Brandz", "found": false}, {"type": "without", "string": "January 2020", "found": false}, {"type": "without", "string": "Oct 9, 2019", "found": false}]}
{"file": "businessjargons.com.leadership.html", "url": "https://businessjargons.com/leadership-styles.html", "text_len": 4104, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "the way he gives directions to his subordinates and ", "found": true}, {"type": "with", "string": "The leadership styles can either be classified on", "found": true}, {"type": "with", "string": "adopts to influence the behavior of his subordinates.", "found": true}, {"type": "without", "string": "Effective Communication", "found": false}, {"type": "without", "string": "International Marketing", "found": false}, {"type": "without", "string": "Communication Process", "found": false}]}
{"file": "Sieci_ IPN, czyli element infrastruktury krytycznej Tygodnik Sieci.html", "url": "https://www.wsieciprawdy.pl/sieci-ipn-czyli-element-infrastruktury-krytycznej-pnews-4715.html", "text_len": 3480, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Zadania Instytutu Pami\u0119ci", "found": true}, {"type": "with", "string": "co zechc\u0105 - czytamy.", "found": true}, {"type": "with", "string": "\u0142amach nowego wydania", "found": true}, {"type": "without", "string": "opublikowano:", "found": false}, {"type": "without", "string": "Zobacz tak\u017ce", "found": false}, {"type": "without", "string": "Zapraszamy te\u017c do subskrypcji", "found": true}]}
{"file": "islamische-zeitung.de-Bundespr\u00e4sident.html", "url": "https://islamische-zeitung.de/bundespraesident-sieht-radikalisierung-bei-querdenkern-und-corona-leugnern/", "text_len": 1548, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "eigenen Worten eine \u201ezunehmende", "found": true}, {"type": "with", "string": "Bundeskriminalamts im \u201ef\u00f6deralen Sicherheitsgef\u00fcge\u201c", "found": true}, {"type": "with", "string": "Verbindungen in weite Teile", "found": true}, {"type": "without", "string": "Schreibe einen Kommentar", "found": false}, {"type": "without", "string": "Anzeige: Mehr lesen mit dem IZ+ Abo", "found": false}, {"type": "without", "string": "Corona & die Folgen, Debatte", "found": false}]}
{"file": "kulturnews.de-Deutschland-Tour.html", "url": "https://kulturnews.de/fensterputzen-mit-den-ratboys-the-window-live/", "text_len": 1021, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "F\u00fcr Julia Steiner, S\u00e4ngerin und Frontfrau der Ratboys", "found": true}, {"type": "with", "string": "war eines unausweichlich", "found": true}, {"type": "with", "string": "Das neue Album der Postcountryband musste den Titel", "found": true}, {"type": "without", "string": "Brecht Reloaded: \u201eWie der Schnee\u201c \u2013 die neue Single von Soeckers", "found": false}, {"type": "without", "string": "Gef\u00fchle wie Rohdiamanten: \u201estrawberry picking\u201c \u2013 die neue Single von being anne", "found": false}, {"type": "without", "string": "Befreite Beats: \u201eKalter Rauch\u201c \u2013 das Singledeb\u00fct von HUND", "found": false}]}
{"file": "world.kbs.co.kr-Temperatures.html", "url": "https://world.kbs.co.kr/service/news_view.htm?lang=e&Seq_Code=181595", "text_len": 1601, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Although the first cold wave alerts of the season were issued in anticipation of frigid morning lows on Tuesday", "found": true}, {"type": "with", "string": "Wednesday is forecast to be even colder.", "found": true}, {"type": "with", "string": "People out on the streets were seen wearing layers throughout the day as Tuesday\u2019s temperatures", "found": true}, {"type": "without", "string": "Most Viewed News", "found": false}, {"type": "without", "string": "Headline News", "found": false}, {"type": "without", "string": "Most Viewed Content", "found": false}]}
{"file": "lapresse.tn.parite.html", "url": "https://lapresse.tn/48915/parite-hommes-femmes-en-tunisie-au-dessous-de-la-moyenne-mondiale/", "text_len": 2959, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Malgr\u00e9 les acquis l\u00e9gislatifs", "found": true}, {"type": "with", "string": "Des actions \u00e0 entreprendre", "found": true}, {"type": "with", "string": "assurer l\u2019\u00e9galit\u00e9 des chances", "found": true}, {"type": "without", "string": "Apr\u00e8s une mise en quarantaine", "found": false}, {"type": "without", "string": "des moments dans le parcours historique", "found": false}, {"type": "without", "string": "partiellement nuageux", "found": false}]}
{"file": "archive.org.rent-a-pastor.com.hochzeitslokation.html", "url": "https://web.archive.org/web/20150721045344/http://rent-a-pastor.com/2015/05/18/neue-hochzeitslokation-in-roedermark-hessen-geheimtipp/", "text_len": 3336, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "am Parkhotel vorbei gefahren und habe \u00fcber das weitr\u00e4umige Gel\u00e4nde gestaunt", "found": true}, {"type": "with", "string": "auch einen unglaublichen 5000 m2 Park mit See und Springbrunnen", "found": true}, {"type": "with", "string": "Redner in der Region findest Du", "found": true}, {"type": "without", "string": "Kommentar verfassen", "found": false}, {"type": "without", "string": "Melden Sie sich f\u00fcr unseren Newsletter an", "found": false}, {"type": "without", "string": "Di-Fr 10-18:00 Uhr. ", "found": false}]}
{"file": "werkzeugforum.de-heizjacke.html", "url": "https://www.werkzeugforum.de/heizjacken-von-bosch/", "text_len": 3784, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Profis binnen drei Minuten auf \u201eBetriebstemperatur\u201c", "found": true}, {"type": "with", "string": "geb\u00fcckter Haltung effizient gew\u00e4rmt. Die Jacke", "found": true}, {"type": "with", "string": "jeweils in den Unisex-Gr\u00f6\u00dfen", "found": true}, {"type": "without", "string": "Mauerschlitze fr\u00e4sen", "found": false}, {"type": "without", "string": "Eine Antwort schreiben", "found": false}, {"type": "without", "string": "Ausbildungsverg\u00fctung: Was", "found": false}]}
{"file": "meininger.de-wachstum.html", "url": "https://www.meininger.de/wein/erzeuger/lvmh-mit-ordentlichem-wachstum", "text_len": 1126, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "meldet f\u00fcr 2021 einen Umsatz von 64,2", "found": true}, {"type": "with", "string": "Wichtige Brands sind etwa die Champagnermarken", "found": true}, {"type": "with", "string": "Joint Venture Cheval des Andes", "found": true}, {"type": "without", "string": "Unsere neue Rubrik. Zum Auftakt fragen", "found": false}, {"type": "without", "string": "Italien-Fans alles, was das Herz begehrt", "found": false}, {"type": "without", "string": "Sektkellerei am", "found": false}]}
{"file": "nestle-marktplatz.de-produkttest.html", "url": "https://www.nestle-marktplatz.de/mitmachen/produkttests", "text_len": 7020, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "k\u00f6nnen Sie die Einstellung ganz", "found": true}, {"type": "with", "string": "auf Foren und Blogs, teilen Sie", "found": true}, {"type": "with", "string": "Wir z\u00e4hlen auf Ihre Meinung", "found": true}, {"type": "without", "string": "Aktuelle Produkttests", "found": false}, {"type": "without", "string": "NESQUIK Trinkfertig", "found": false}, {"type": "without", "string": "Wie l\u00e4uft ein Produkttest ab", "found": false}]}
{"file": "eluniversal.com-senador.html", "url": "https://www.eluniversal.com/internacional/125703/senador-republicano-califica-a-biden-de-incapacitado", "text_len": 3710, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "y confundido. No sabe d\u00f3nde est\u00e1 la mitad del tiempo.", "found": true}, {"type": "with", "string": "en alusi\u00f3n a la marca Make America", "found": true}, {"type": "with", "string": "sobre la declaraci\u00f3n de Scott, Biden sonri\u00f3 y dijo", "found": true}, {"type": "without", "string": "Siguenos en Telegram, Instagram, Facebook y Twitter", "found": false}, {"type": "without", "string": "Lluvias en Colombia dejan 47 fallecidos", "found": false}, {"type": "without", "string": "Emmanuel presentar\u00e1 en", "found": false}]}
{"file": "tafelblog.de.europa.html", "url": "https://www.tafelblog.de/welches-europa-wir-wollen/", "text_len": 1946, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Knapp zwei Tage vor der Europawahl", "found": true}, {"type": "with", "string": "Die Ergebnisse der B\u00fclow-Wahl", "found": true}, {"type": "with", "string": "bei uns viele Stimmen hinzugewinnen", "found": true}, {"type": "without", "string": "Schreibe einen Kommentar", "found": false}, {"type": "without", "string": "Aachen 1933 \u2013 1945", "found": false}, {"type": "without", "string": "Meinen Namen, E-Mail", "found": false}]}
{"file": "caymancompass.com-prison.html", "url": "https://www.caymancompass.com/2022/05/04/prison-official-anyone-could-escape-from-northward/", "text_len": 353, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "The evidence was given in support of a decision", "found": false}, {"type": "with", "string": "provided by the most dangerous and high risk offenders.\u201d", "found": false}, {"type": "with", "string": "added that the prison estate was not considered", "found": false}, {"type": "without", "string": "The prison official\u2019s affidavit highlights security", "found": false}, {"type": "without", "string": "You have 4 free articles left this month", "found": false}, {"type": "without", "string": "Previous article", "found": false}]}
{"file": "instyle.com.cancer.html", "url": "https://www.instyle.com/beauty/wigs-for-black-women-cancer", "text_len": 7285, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "decided to ditch her relaxer and transition back", "found": true}, {"type": "with", "string": "to see themselves provides privacy and dignity.", "found": true}, {"type": "with", "string": "All women, regardless of hair type, should", "found": true}, {"type": "without", "string": "Scroll Down For the Next Article", "found": false}, {"type": "without", "string": "A lot of the royal families had these", "found": false}, {"type": "without", "string": "On the other hand, Black doo-wop girl", "found": false}]}
{"file": "wochenblatt.com-Heinen-Essen.html", "url": "https://www.wochenblatt.com/landwirtschaft/agrarpolitik/heinen-esser-offen-fuer-existenzgruendungspraemie-12810183.html", "text_len": 2376, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Die Jugendverb\u00e4nde der Landwirtschaft in", "found": true}, {"type": "with", "string": "Die Jugendverb\u00e4nde der Landwirtschaft in", "found": true}, {"type": "with", "string": "besprach sie Fragen zur erwartenden", "found": true}, {"type": "without", "string": "Vertreterinnen und Vertreter der", "found": false}, {"type": "without", "string": "Jugendverb\u00e4nde fordern", "found": false}, {"type": "without", "string": "Die Jugendverb\u00e4nde der", "found": true}]}
{"file": "gruene-bundestag.de-COP26.html", "url": "https://www.gruene-bundestag.de/themen/klimaschutz/cop26-in-glasgow", "text_len": 3587, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Es ist h\u00f6chste Zeit", "found": true}, {"type": "with", "string": "Versprechen, ab 2020 j\u00e4hrlich", "found": true}, {"type": "with", "string": "Die Initiative der britischen", "found": true}, {"type": "without", "string": "Andrew Milligan", "found": false}, {"type": "without", "string": "Mehr Klimaschutz", "found": false}, {"type": "without", "string": "1,5 Grad-Pfad zu kommen.", "found": false}]}
{"file": "bmbf.de.energiewende.html", "url": "https://www.bmbf.de/bmbf/de/forschung/energiewende-und-nachhaltiges-wirtschaften/energiewende-und-nachhaltiges-wirtschaften_node.html", "text_len": 3164, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "L\u00e4ndliche Regionen schrumpfen", "found": true}, {"type": "with", "string": "Die Bundesregierung investiert", "found": true}, {"type": "with", "string": "mit vielf\u00e4ltigen Forschungsprojekten", "found": true}, {"type": "without", "string": "Thinkstock", "found": false}, {"type": "without", "string": "Chancen f\u00fcr eine biobasierte", "found": false}, {"type": "without", "string": "Folgen Sie uns", "found": false}]}
{"file": "insubordinant.wordpress.com.speed.html", "url": "https://insubordinant.wordpress.com/2015/08/11/need-for-speed/", "text_len": 3765, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Der kleine Junge bremst abrupt vor mir", "found": true}, {"type": "with", "string": "Kein Kerl ist das wert, Kleines", "found": true}, {"type": "with", "string": "dem kleinen Polo so viel Gas wie er gerade", "found": true}, {"type": "without", "string": "5 Bloggern gef\u00e4llt das.", "found": false}, {"type": "without", "string": "Gedanken zu \u201cNeed for Speed\u201d", "found": false}, {"type": "without", "string": "Ver\u00f6ffentlicht in:", "found": false}]}
{"file": "thepointsguy.com.alaska.html", "url": "https://thepointsguy.com/news/alaska-airlines-oneworld-membership-new-date/", "text_len": 3915, "tp": 3, "fn": 0, "fp": 3, "tn": 0, "details": [{"type": "with", "string": "has a new date for when it will be a full fledged member of the Oneworld", "found": true}, {"type": "with", "string": "at its Seattle/Tacoma International Airport (SEA) base in 2019.", "found": true}, {"type": "with", "string": "hat it launched in 2020, according to Cirium", "found": true}, {"type": "without", "string": "This post contains references to products from one or more", "found": true}, {"type": "without", "string": "Bonus value is an estimated value calculated by", "found": true}, {"type": "without", "string": "responsibility to ensure all posts and/or questions are answered.", "found": true}]}
{"file": "deutsche-handwerkszeitung.de-eigentumsvorbehalt.html", "url": "https://www.deutsche-handwerks-zeitung.de/eigentumsvorbehalt-das-sollten-kaeufer-und-verkaeufer-wissen-168384/", "text_len": 6674, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u00fcbergibt der Verk\u00e4ufer dem K\u00e4ufer die", "found": true}, {"type": "with", "string": "der K\u00e4ufer dem Verk\u00e4ufer zu, das Eigentum", "found": true}, {"type": "with", "string": "Lieferungen beglichen wurden. Ein", "found": true}, {"type": "without", "string": "Sie werkt\u00e4glich, was erfolgreiche", "found": false}, {"type": "without", "string": "Stapel mit Mauerziegeln: Wenn ein", "found": false}, {"type": "without", "string": "WEITERE BEITR\u00c4GE ZU", "found": false}]}
{"file": "gelbe-liste.de-chininum.html", "url": "https://www.gelbe-liste.de/produkte/Chininum-salicylicum-D4-DHU-Tabletten_433873", "text_len": 6542, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Gebrauchsinformation", "found": false}, {"type": "with", "string": "Keine Basisinformation zu diesem", "found": true}, {"type": "with", "string": "Hersteller bereitgestellt", "found": true}, {"type": "without", "string": "Mit der Identa-Suche", "found": false}, {"type": "without", "string": "bei Eisenmangel", "found": false}, {"type": "without", "string": "Zusatzinfos f\u00fcr", "found": false}]}
{"file": "ahlen.de.reparaturcafe.html", "url": "https://www.ahlen.de/start/aktuelles/aktuelle/information/nachricht/aus-ahlen/reparaturcafe-am-31-januar/", "text_len": 961, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Jede Menge Spa\u00df bereitet es den", "found": false}, {"type": "with", "string": "Das Projekt ist eine Kooperationsveranstaltung", "found": true}, {"type": "with", "string": "althausa@stadt.ahlen.de", "found": true}, {"type": "without", "string": "Stadtverwaltung Ahlen Rechnungseingang", "found": false}, {"type": "without", "string": "Internetredaktion Stadt Ahlen", "found": false}, {"type": "without", "string": "Allgemeine Sprechstunden der Verwaltung", "found": false}]}
{"file": "baike.baidu.com.tanya.html", "url": "https://baike.baidu.com/item/%E8%94%A1%E5%81%A5%E9%9B%85", "text_len": 9430, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "1975\u5e741\u670828\u65e5\u51fa\u751f", "found": false}, {"type": "with", "string": "\u72ec\u7acb\u5236\u4f5c", "found": true}, {"type": "with", "string": "2000\u5e74\u5728\u65b0\u52a0\u5761", "found": true}, {"type": "without", "string": "\u539f\u6728\u6e23\u7537", "found": false}, {"type": "without", "string": "\u7f51\u53cb\u5370\u8c61", "found": false}, {"type": "without", "string": "\u767e\u79d1\u8bcd", "found": false}]}
{"file": "archive.org.steinzeitwissen.de.werkzeuge.html", "url": "https://web.archive.org/web/20150206075900/http://www.steinzeitwissen.de/artefakttypen/werkzeuge-des-neandertalers-und-des-modernen-menschen", "text_len": 6435, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "erk\u00adzeug\u00adty\u00adpen und ihre Lauf\u00adzei\u00adten be\u00adhan\u00addelt.", "found": false}, {"type": "with", "string": "uge und sah sich of\u00adfen\u00adbar nicht ver\u00adan\u00adlasst, die Kern\u00adwerk\u00adzeuge zu \u00fcbernehmen.", "found": false}, {"type": "with", "string": "m Alt\u00adpa\u00adl\u00e4o\u00adli\u00adthi\u00adkum bis in die Neu\u00adzeit, T\u00fc\u00adbin\u00adgen 2012, Kerns Ver\u00adlag, S. 426", "found": false}, {"type": "without", "string": "Proudly powered by WordPress.", "found": false}, {"type": "without", "string": "\u00dcberblick + Sch\u00fclerhilfe", "found": false}, {"type": "without", "string": "Artikel Mittelpal\u00e4olithikum", "found": false}]}
{"file": "zdnet.de.facebook.html", "url": "https://www.zdnet.de/88298335/facebook-wehrt-sich-gegen-maas-gesetz", "text_len": 3554, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "esjustizminister Heiko Maas ge\u00e4u\u00dfert, per Gesetz \u201eCompliance-Regeln f\u00fcr Soziale Netzwerke\u201c e", "found": true}, {"type": "with", "string": "acebook zus\u00e4tzliche Kosten von 530 Millionen Euro pro Jahr zukommen, f\u00fcr \u201erealistisch\u201c.", "found": true}, {"type": "with", "string": "nste anbieten. W\u00e4hrend beispielsweise die Leugnung des Holocaust hierzulande unter Str", "found": true}, {"type": "without", "string": "Whitepaper", "found": false}, {"type": "without", "string": "Bericht: Apple k\u00fcndigt zur WWDC 13,3-Zoll-MacBook und 24-Zoll-iMac mit ARM-Prozessoren an", "found": false}, {"type": "without", "string": "erden Sie die Corona Warn-App der Bundesregierung verwenden?", "found": false}]}
{"file": "economist.com.thinking.html", "url": "https://www.economist.com/open-future/2018/06/18/why-collaborative-thinking-beats-individual-smarts", "text_len": 11766, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "about the role that the proportion of men and women in", "found": true}, {"type": "with", "string": "You might call this a measure of a person", "found": true}, {"type": "with", "string": "Can groups be intelligent in the same way individuals", "found": true}, {"type": "without", "string": "Sign up to our free daily newsletter", "found": false}, {"type": "without", "string": "Published since September 1843 to take part in", "found": false}, {"type": "without", "string": "Jun 18th 2018", "found": false}]}
{"file": "bundesrat.de-erinnerungen.html", "url": "https://www.bundesrat.de/SharedDocs/texte/22/20220127-weremember-gedenkstunde-kranzniederlegung.html;jsessionid=FD52ED97F4C3551B332D2AA670DAE45C.1_cid382", "text_len": 5748, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "wurde als Siebenj\u00e4hrige von Stuttgart", "found": true}, {"type": "with", "string": "Neben der gastgebenden Bundestagspr\u00e4sidentin", "found": true}, {"type": "with", "string": "als Zeichen des Gedenkens an die Opfer", "found": true}, {"type": "without", "string": "Presse- und Informationsamt der Bundesregierung | Jesco Denzel", "found": false}, {"type": "without", "string": " Bundesrat | Frank Br\u00e4uer", "found": true}, {"type": "without", "string": "Ist dieser Beitrag hilfreich?", "found": false}]}
{"file": "pferd-aktuell.de-stellungnahmen.html", "url": "https://www.pferd-aktuell.de/news/aktuelle-meldungen/zucht/stellungnahme-der-fn-zum-hlp-pilotjahr-2022", "text_len": 2060, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Bereits seit Jahren haben sich die Zuchtverb\u00e4nde", "found": true}, {"type": "with", "string": "Pferde altersgem\u00e4\u00df stattfindet und im Einklang", "found": true}, {"type": "with", "string": "Veranlagungspr\u00fcfung von Hengsten der deutschen", "found": true}, {"type": "without", "string": "zur\u00fcck zur vorherigen Seite", "found": false}, {"type": "without", "string": "HLP: Zuchtverb\u00e4nde planen 2022 als Pilotjahr", "found": false}, {"type": "without", "string": "TSF Dalera BB: T\u00e4nzerin im", "found": false}]}
{"file": "helge.at.mahu.html", "url": "http://www.helge.at/2014/03/warum-wien-zu-blod-fur-eine-staufreie-mahu-ist/", "text_len": 2805, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die \u201cKrone\u201d zitiert heute meinen", "found": true}, {"type": "with", "string": "die rote Personalvertretung der Wiener Linien", "found": true}, {"type": "with", "string": "Bl\u00f6d sind also nicht die Wiener", "found": true}, {"type": "without", "string": "Warum Michel Reimon nach Br\u00fcssel muss", "found": false}, {"type": "without", "string": "Helge Fahrnberger's personal pages", "found": false}, {"type": "without", "string": "Provider information ", "found": false}]}
{"file": "alexanderlasch.wordpress.com.sprachgeschichte.html", "url": "https://alexanderlasch.wordpress.com/2019/11/14/was-das-christkind-und-native-americans-gemeinsam-haben-oder-warum-wir-sprachgeschichte-brauchen/", "text_len": 6093, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Wenn man sich heutzutage", "found": true}, {"type": "with", "string": "An dieser und anderer Stelle", "found": true}, {"type": "with", "string": "Genau dieses Bild ruft die AfD", "found": true}, {"type": "without", "string": "Es gibt noch keine Kommentare.", "found": false}, {"type": "without", "string": "Das setzt das Verst\u00e4ndnis voraus", "found": true}, {"type": "without", "string": "Alle Artikel und Inhalte", "found": false}]}
{"file": "waldwiesen.net-holl\u00e4nderholzhandel.html", "url": "https://www.waldwissen.net/de/lernen-und-vermitteln/der-hollaenderholzhandel", "text_len": 11814, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Heute l\u00e4ngst vergessen, war der Holzhandel", "found": false}, {"type": "with", "string": "Vom 17. bis ins 19. Jahrhundert war der Begriff ", "found": true}, {"type": "with", "string": "Drittl\u00e4nder eintreffen. Auch der russische", "found": true}, {"type": "without", "string": "Originalartikel", "found": false}, {"type": "without", "string": "Lernen und Vermitteln", "found": false}, {"type": "without", "string": "Wissenstransfer, \u00d6ffentlichkeitsarbeit, Waldp\u00e4dagogik", "found": false}]}
{"file": "auto-motor.at-hyundaitest.html", "url": "https://auto-motor.at/Hyundai/Tests/Hyundai-Santa-Fe-Plug-in-Test.html", "text_len": 7980, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Santa Fe ist weit", "found": false}, {"type": "with", "string": "Ausstattung Sicherheit: 1", "found": true}, {"type": "with", "string": "CO2 Aussto\u00df pro km in", "found": true}, {"type": "without", "string": "Die neuesten Meldungen", "found": false}, {"type": "without", "string": "Der neue SL ist erstmals", "found": false}, {"type": "without", "string": "Test verraten wir", "found": false}]}
{"file": "tennismagazin.de-viertelfinale.html", "url": "https://www.tennismagazin.de/news/zverev-zieht-ins-viertelfinale-von-montpellier-ein/", "text_len": 1442, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "besa\u00df der mit einer Wildcard ausgestattete", "found": true}, {"type": "with", "string": "Niederlage gegen Jonathan Erlich/Edouard", "found": true}, {"type": "with", "string": "Achtelfinal-Aus gegen Denis Shapovalov", "found": true}, {"type": "without", "string": "Alexander Zverev steht im Viertelfinale des ATP-Turniers", "found": false}, {"type": "without", "string": "AUCH AUF TENNISMAGAZIN.DE", "found": false}, {"type": "without", "string": "Ein Kommentar von tennis", "found": false}]}
{"file": "be.ch-impfen.html", "url": "https://www.be.ch/de/start/dienstleistungen/medien/medienmitteilungen.html?newsID=c3aa546f-24d3-4b47-9c0c-59db58b2f725", "text_len": 1952, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "daher die zus\u00e4tzlich aufgebauten Impforte", "found": true}, {"type": "with", "string": "schwere Krankheitsverl\u00e4ufe zu sch\u00fctzen.", "found": true}, {"type": "with", "string": "eine Kartenansicht umgestellt werden.", "found": true}, {"type": "without", "string": "Seite teilen", "found": false}, {"type": "without", "string": "Inhalt", "found": false}, {"type": "without", "string": "Zur\u00fcck zur \u00dcbersicht", "found": false}]}
{"file": "theoriginalcopy.de.baby.html", "url": "https://theoriginalcopy.de/editors-letter-baby/", "text_len": 6741, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Lange habe ich diesen", "found": true}, {"type": "with", "string": "W\u00e4hrend ich diese Wort", "found": true}, {"type": "with", "string": "Bis dahin halte ich Euch auf Instagram ", "found": true}, {"type": "without", "string": "Teilen", "found": false}, {"type": "without", "string": "Schreibe einen Kommentar", "found": false}, {"type": "without", "string": "Copyright 2022", "found": false}]}
{"file": "metrotimes.com-Mezcal.html", "url": "https://www.metrotimes.com/food-drink/detroits-mezcal-restaurant-goes-beyond-familiar-mexican-fare-34565910", "text_len": 5406, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "The Mariachi Mexico 2020 quartet", "found": true}, {"type": "with", "string": "plays every other Sunday and they are a treat", "found": true}, {"type": "with", "string": "really good voices, and they take requests.", "found": true}, {"type": "without", "string": "Join Detroit Metro Times Newsletters", "found": false}, {"type": "without", "string": "Scroll to read more Restaurant reviews articles", "found": false}, {"type": "without", "string": "The Red Sea in Dearborn is a great catch", "found": false}]}
{"file": "gala.fr.surnom.html", "url": "https://www.gala.fr/l_actu/news_de_stars/jean-paul-delevoye-monsieur-retraites-du-gouvernement-jacques-chirac-lui-donnait-un-surnom-peu-flatteur_439447", "text_len": 2013, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Charg\u00e9 de porter la r\u00e9forme des retraites", "found": true}, {"type": "with", "string": "Chirac le surnommaitle Grand Con, parce", "found": true}, {"type": "with", "string": "un dirigeant de LREM dans un portrait", "found": true}, {"type": "without", "string": "Cr\u00e9dits photos : Bestimage", "found": true}, {"type": "without", "string": "Articles les plus lus", "found": false}, {"type": "without", "string": "L'actu", "found": false}]}
{"file": "chip.de.bestcrypt.html", "url": "https://www.chip.de/downloads/BestCrypt_13003274.html", "text_len": 2162, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "kann verschl\u00fcsselte, virtuelle Laufwerke anlegen", "found": true}, {"type": "with", "string": "Der integrierte Anti-Keylogger und", "found": true}, {"type": "with", "string": "Homepage des Herstellers nachlesen", "found": true}, {"type": "without", "string": "BestCrypt : Alternative Downloads", "found": false}, {"type": "without", "string": "UNSERE SHOPPING-GUTSCHEINE", "found": false}, {"type": "without", "string": " F\u00fcr Links auf dieser Seite erh\u00e4lt CHIP", "found": false}]}
{"file": "journals.univie.ac.at.submissions.html", "url": "https://journals.univie.ac.at/index.php/wdr/about/submissions", "text_len": 4397, "tp": 4, "fn": 1, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "m\u00fcssen Sie registriert und eingeloggt sein.", "found": true}, {"type": "with", "string": "Soweit m\u00f6glich, wurden den Literaturangaben", "found": true}, {"type": "with", "string": "Betonungen kursiv", "found": true}, {"type": "with", "string": "Internetquellen", "found": true}, {"type": "with", "string": "wird in K\u00fcrze bereitgestellt.", "found": false}, {"type": "without", "string": "Beitragseinreichung", "found": true}, {"type": "without", "string": "Aktuelle Ausgabe", "found": false}, {"type": "without", "string": "Suchen", "found": false}]}
{"file": "rhein-neckar-loewen.de-vorverkauf.html", "url": "https://www.rhein-neckar-loewen.de/kleiner-vorverkauf-fuer-liga-heimspiele-gestartet-920981", "text_len": 1461, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "k\u00f6nnen die Rhein-Neckar L\u00f6wen lediglich", "found": true}, {"type": "with", "string": "12. Februar, 20.30 Uhr treffen die L\u00f6wen", "found": true}, {"type": "with", "string": "sollte sich die erlaubte Zuschauer-Kapazit\u00e4t", "found": true}, {"type": "without", "string": "Wenn du per E-Mail \u00fcber Aktuelles aus", "found": false}, {"type": "without", "string": "Alle News anzeigen", "found": false}, {"type": "without", "string": "Ver\u00f6ffentlichung", "found": true}]}
{"file": "gnadlib.wordpress.com.scherenschnitt.html", "url": "https://gnadlib.wordpress.com/2020/01/05/scherenschnitt-3/", "text_len": 1512, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Stadt steht schwarz", "found": true}, {"type": "with", "string": "F\u00fcr den von der Kamera", "found": true}, {"type": "with", "string": "besser geworden\u2026", "found": true}, {"type": "without", "string": "Auf gnaddrig ad libitum gibt", "found": false}, {"type": "without", "string": "Ob dieser Hinweis n\u00f6tig", "found": false}, {"type": "without", "string": "Haftungsbeschr\u00e4nkung f\u00fcr externe Links", "found": false}]}
{"file": "d90b19386e2b48559082547016cbe5ec.html", "url": "https://www.welt.de/regionales/hamburg/article202159566/Verhaertete-Fronten-nach-Tumulten-bei-Luckes-Vorlesung.html", "text_len": 3325, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Der AStA (Allgemeiner Studierendenausschuss) verkl\u00e4re die Vorf\u00e4lle", "found": true}, {"type": "with", "string": "betonte, nicht zu den St\u00f6rungen im H\u00f6rsaal aufgerufen zu haben", "found": true}, {"type": "with", "string": "hie\u00df es anschlie\u00dfend.", "found": true}, {"type": "without", "string": "Lesedauer: 3 Minuten", "found": false}, {"type": "without", "string": "Vom Oma-Scho\u00dfhund zur\u00fcck zum Trend-Hund", "found": false}, {"type": "without", "string": "Newsticker", "found": false}]}
{"file": "dalloz-actualite.fr.raoult.html", "url": "https://www.dalloz-actualite.fr/node/libre-cours-raoult-nazis-et-moi", "text_len": 3475, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "C\u2019est la guerre. Et pourtant", "found": true}, {"type": "with", "string": "Vive le professeur Raoult !", "found": true}, {"type": "with", "string": "Que les magistrats sachent qu\u2019ils peuvent com", "found": true}, {"type": "without", "string": "Votre commentaire ", "found": false}, {"type": "without", "string": "otre adresse e-m", "found": false}, {"type": "without", "string": "otre no", "found": false}]}
{"file": "jagdverband.de-erschuettert.html", "url": "https://www.jagdverband.de/wir-sind-tief-erschuettert", "text_len": 1550, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "und schnelle Aufkl\u00e4rung", "found": false}, {"type": "with", "string": "niemals anonym erworben", "found": true}, {"type": "with", "string": "Sch\u00e4tzung von Experten.", "found": true}, {"type": "without", "string": "Wer wir sind und was wir tun", "found": false}, {"type": "without", "string": "(Quelle: Fleischmann/Unsplash/DJV)", "found": false}, {"type": "without", "string": "Unsere Akademie", "found": false}]}
{"file": "tierschutzpartei.de-wildvogelauffang.html", "url": "https://www.tierschutzpartei.de/eine-private-wildvogelauffang-und-auswilderungsstation/", "text_len": 3420, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Dortmund-Dorstfeld jedoch anders sein", "found": true}, {"type": "with", "string": "Ewald Ferlemann und sein", "found": true}, {"type": "with", "string": "Sebastian Everding stellt nach", "found": true}, {"type": "without", "string": "8. November 2021", "found": false}, {"type": "without", "string": "Wildvogelstation Ferlemann in", "found": false}, {"type": "without", "string": "Aktuelle Wahlen", "found": false}]}
{"file": "spox.com-corona-fealle.html", "url": "https://www.spox.com/de/sport/olympia/2202/Artikel/zwei-corona-faelle-olympische-spiele-peking-eric-frenzel-terence-weber.html", "text_len": 2555, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Kombinierer waren am Tag zuvor in China", "found": true}, {"type": "with", "string": "besten sieben Athleten des Gesamtweltcups", "found": true}, {"type": "with", "string": "November im finnischen Ruka den ersten Weltcupsieg", "found": true}, {"type": "without", "string": "Die Nordischen Kombinierer Terence Weber", "found": false}, {"type": "without", "string": "Gegen Peking: Tibeter protestieren vor IOC-Hauptquartier", "found": false}, {"type": "without", "string": "Olympia 2022 - Nordische Kombination:", "found": true}]}
{"file": "lokalo.de-Weinbergsbahnen.html", "url": "https://lokalo.de/artikel/310144/weinbergsbahnen-in-erden-nicht-manipuliert-ermittlungen-zu-trittenheimer-fall-gehen-weiter/", "text_len": 965, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Vorausgegangen war ein Fall in Trittenheim", "found": true}, {"type": "with", "string": "bei dem sich ein 21-j\u00e4hriger Winzersohn", "found": true}, {"type": "with", "string": "aus dem Ort am 25.9.2023 nur durch einen beherzten Sprung retten konnte", "found": true}, {"type": "without", "string": "++ Wetter in der Region: Aussichten bis Freitag mild, aber ungem\u00fctlich ++", "found": false}, {"type": "without", "string": "FDP-Landes- und Kommunalpolitiker stellen Bundes-Ampel infrage \u2013 sieben aus RLP", "found": false}, {"type": "without", "string": "VOLKSWAGEN ZENTRUM TRIER", "found": false}]}
{"file": "wehranlage-horka.de.887.html", "url": "http://www.wehranlage-horka.de/veranstaltung/887/", "text_len": 948, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "G\u00f6rlitzer Str. 45", "found": false}, {"type": "with", "string": "W\u00e4hrend Sie \u00fcber den Markt schlendern", "found": true}, {"type": "with", "string": "Konzert bei Kerzenschein", "found": false}, {"type": "without", "string": "Infos zum Verein", "found": false}, {"type": "without", "string": "nach oben", "found": false}, {"type": "without", "string": "Datenschutzerkl\u00e4rung", "found": false}]}
{"file": "boingboing.net.millenials.html", "url": "https://boingboing.net/2013/07/19/hating-millennials-the-preju.html", "text_len": 2496, "tp": 2, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Click through for the whole thing.", "found": true}, {"type": "with", "string": "The generation we love to dump on", "found": true}, {"type": "without", "string": "GET THE BOING BOING NEWSLETTER", "found": false}, {"type": "without", "string": "happy mutants", "found": false}, {"type": "without", "string": "Patti Smith and Stewart Copeland", "found": true}]}
{"file": "0b4609a864eb4fa0bbcb2b395f6be9eb.html", "url": "https://www.ardmediathek.de/swr/player/Y3JpZDovL3N3ci5kZS9hZXgvbzExNjIyMjY/nahrungsergaenzungsmittel-das-dubiose-geschaeft-mit-der-hoffnung", "text_len": 511, "tp": 1, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Dubiose H\u00e4ndler versprechen Hilfe bei Schlafst\u00f6rungen", "found": true}, {"type": "without", "string": "Navigation schliessen", "found": false}, {"type": "without", "string": "Mehr aus der Sendung", "found": false}, {"type": "without", "string": "Unfallbetr\u00fcger", "found": false}]}
{"file": "urlaubsarchitektur.de.glashaus.html", "url": "https://www.urlaubsarchitektur.de/de/das-glashaus-in-der-uckermark/ ", "text_len": 3398, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Mit dem Glashaus hat der d\u00e4nische Architekt", "found": true}, {"type": "with", "string": "Das Zusammenspiel aus Holz, Glas, poliertem Estrich", "found": true}, {"type": "with", "string": "Die Fernw\u00e4rme kommt aus", "found": true}, {"type": "without", "string": "\u00dcbersichtakarte", "found": false}, {"type": "without", "string": "Lesezeichen hinzuf\u00fcgen", "found": false}, {"type": "without", "string": "weiterlesen", "found": false}]}
{"file": "elmostrador.cl-congreso.html", "url": "https://www.elmostrador.cl/destacado/2022/05/04/las-trabas-del-congreso-discusion-parlamentaria-sobre-normas-de-una-nueva-constitucion-podria-tardar-decadas/", "text_len": 11188, "tp": 2, "fn": 1, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "en el caso de que la opci\u00f3n Apruebo se imponga", "found": false}, {"type": "with", "string": "Lo cierto es que, para que las nuevas", "found": true}, {"type": "with", "string": "constituidos, y en particular los partidos", "found": true}, {"type": "without", "string": "Nueva Constituci\u00f3n", "found": true}, {"type": "without", "string": "Comprensi\u00f3n del Derecho", "found": false}, {"type": "without", "string": "Directora Ejecutiva de Fundaci\u00f3n", "found": false}]}
{"file": "yle.fi.3-11212601.html", "url": "https://yle.fi/uutiset/3-11212601", "text_len": 3514, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Vuodenaikojen vaihtuminen", "found": true}, {"type": "with", "string": "Ilmastonmuutos vaikuttaa terveyteen", "found": true}, {"type": "with", "string": "tuntuakin raskaalta.", "found": true}, {"type": "without", "string": "Korkeasaaren karhut", "found": true}, {"type": "without", "string": "Saat Ylen parhaat", "found": false}, {"type": "without", "string": "Wuhanilainen", "found": false}]}
{"file": "assabah.com.tn.article.html", "url": "http://www.assabah.com.tn/article/164913/%D8%A7%D9%84%D9%86%D8%A7%D8%B4%D8%B7-%D8%A7%D9%84%D8%AD%D9%82%D9%88%D9%82%D9%8A-%D8%A7%D9%84%D8%B3%D9%88%D8%AF%D8%A7%D9%86%D9%8A-%D8%AE%D8%A7%D9%84%D8%AF-%D8%B9%D8%A8%D8%AF-%D8%A7%D9%84%D9%83%D8%B1%D9%8A%D9%85-%D9%85%D8%A7%D8%B3%D8%A7-%D9%84%D9%80%C2%AB%D8%A7%D9%84%D8%B5%D8%A8%D8%A7%D8%AD%C2%BB-%D9%83%D9%84-%D8%A7%D9%84%D8%B4%D8%B1%D9%88%D8%B7-%D9%85%D8%AA%D9%88%D9%81%D8%B1%D8%A9-%D9%84%D8%AB%D9%88%D8%B1%D8%A9", "text_len": 7649, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u0645\u0646\u0630 \u0628\u062f\u0621", "found": true}, {"type": "with", "string": "\u0643\u0644 \u0627\u0644\u0645\u062c\u0627\u0644\u0627\u062a", "found": true}, {"type": "with", "string": "\u0648\u0645\u0627\u0630\u0627 \u0639\u0646 \u062d\u0642\u064a\u0642\u0629", "found": true}, {"type": "without", "string": "\u0643\u0648\u0631\u0648\u0646\u0627 \u064a\u0642\u062a\u0644", "found": false}, {"type": "without", "string": "\u063a\u0627\u0626\u0645 \u062c\u0632\u0626\u064a\u0627", "found": false}, {"type": "without", "string": "\u0625\u0636\u0627\u0641\u0629 \u062a\u0639\u0644\u064a\u0642 \u062c\u062f\u064a\u062f", "found": false}]}
{"file": "zahlenzauberin.wordpress.com.ferien.html", "url": "https://zahlenzauberin.wordpress.com/2012/08/22/was-zum-horen-in-den-ferien/", "text_len": 793, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Dank Kabelanschluss kann ich", "found": true}, {"type": "with", "string": "der auch nur 20 Minuten dauert.", "found": true}, {"type": "with", "string": "Liebe zum Kind?", "found": true}, {"type": "without", "string": "Teilen Sie dies mit:", "found": false}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}, {"type": "without", "string": "Abgelegt unter:", "found": false}]}
{"file": "mediaarchitecture.de.weber.html", "url": "http://mediaarchitecture.de/jens-weber/", "text_len": 2724, "tp": 3, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "1997 Medientechnik-Studium", "found": true}, {"type": "with", "string": "Umsetzung von \u00fcber 70 kommerziellen Multimediaprojekten", "found": true}, {"type": "with", "string": "Nominierung Deutscher Multimedia Award", "found": true}, {"type": "without", "string": "Alle Inhalte unterliegen", "found": false}, {"type": "without", "string": "Projekte", "found": false}]}
{"file": "lecker.de.schneewittchen.html", "url": "https://www.lecker.de/schneewittchen-kuchen-mit-mini-marshmallows-77975.html", "text_len": 2899, "tp": 6, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Mini-Marshmallows getoppt wird", "found": true}, {"type": "with", "string": "Vanillepuddingpulver", "found": true}, {"type": "with", "string": "Frischhaltefolie", "found": true}, {"type": "with", "string": "300 Minuten Wartezeit", "found": true}, {"type": "with", "string": "Zum Servieren Kuchen vorsichtig", "found": true}, {"type": "with", "string": "390 kcal", "found": true}, {"type": "without", "string": "Pin it", "found": false}, {"type": "without", "string": "Versenden", "found": false}, {"type": "without", "string": "Gebratener Blumenkohlsalat", "found": false}]}
{"file": "plantcaretoday.com.bougainvillea.html", "url": "https://plantcaretoday.com/how-to-grow-and-care-for-bougainvillea.html", "text_len": 13375, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "I need some help with Bougainvillea care and watering", "found": true}, {"type": "with", "string": "In the United States, the peak blooms are typically", "found": true}, {"type": "with", "string": "Hardiest species, with somewhat furry foliage and red-purple", "found": true}, {"type": "without", "string": "Plantcaretoday.com is a participant in the Amazon Services", "found": false}, {"type": "without", "string": "Plant Care Newsletter", "found": false}, {"type": "without", "string": "Tips On Getting Rid Of Caterpillars On Roses", "found": false}]}
{"file": "uusisuomi.fi.angela.html", "url": "https://www.uusisuomi.fi/uutiset/sanna-marin-tapasi-angela-merkelin-myos-saksa-haluaa-pitaa-kiinni-maataloustuista-meidan-nakemyksiamme-suurimpana-nettomaksajana-ei-ole-otettu-riittavasti-huomioon/b29c11d3-9590-4045-8e2c-a568f9f24617", "text_len": 1562, "tp": 3, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "ehdist\u00f6tilaisuudessa Berliiniss\u00e4.", "found": true}, {"type": "with", "string": "Merkel korosti.", "found": true}, {"type": "with", "string": "Charles Michels", "found": true}, {"type": "without", "string": "Kuva: ALEXANDER BECHER", "found": false}, {"type": "without", "string": "Brexit kasvattaa maksuja", "found": false}, {"type": "without", "string": "uudesta maahanmuuttolaista", "found": false}, {"type": "without", "string": "hiilineutraaliuteen ilman vippaskonsteja", "found": false}]}
{"file": "emacspeak.blogspot.com.meta.html", "url": "https://emacspeak.blogspot.com/2019/10/meta-programming-in-emacs-using.html", "text_len": 2095, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Decorators in Python enable you to modify", "found": true}, {"type": "with", "string": "entitled Beautiful Code, OReilly.", "found": true}, {"type": "with", "string": "Speak line moved to after next-line and", "found": false}, {"type": "without", "string": "Followers (7) ", "found": false}, {"type": "without", "string": "View my complete profile", "found": false}, {"type": "without", "string": "Simple theme. Powered by", "found": false}]}
{"file": "handwerksblatt.de-Friseurbesuch.html", "url": "https://www.handwerksblatt.de/themen-specials/coronaschutz-im-betrieb/2g-3g-was-gilt-beim-friseurbesuch", "text_len": 13806, "tp": 2, "fn": 1, "fp": 3, "tn": 0, "details": [{"type": "with", "string": "Corona und die neue Omikron-Variante", "found": false}, {"type": "with", "string": "Besuch beim Friseur oder der Kosmetikerin", "found": true}, {"type": "with", "string": "bis einschlie\u00dflich 15 Jahren brauchen", "found": true}, {"type": "without", "string": "Alle Angaben ohne Gew\u00e4hr", "found": true}, {"type": "without", "string": "Quelle: Landesregierung", "found": true}, {"type": "without", "string": "DHB jetzt auch digital!", "found": true}]}
{"file": "malteser.de-Bev\u00f6lkerungsschutz.html", "url": "https://www.malteser.de/newsdetails/news/hilfsorganisationen-fordern-von-kuenftiger-bundesregierung-investitionsoffensive-im-bevoelkerungsschutz-1.html", "text_len": 4412, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "in den Bev\u00f6lkerungsschutz", "found": true}, {"type": "with", "string": "beh\u00f6rdlichen Strukturen und unter", "found": true}, {"type": "with", "string": "Achtung Redaktion:", "found": true}, {"type": "without", "string": "Zur\u00fcck zu allen Meldungen", "found": false}, {"type": "without", "string": "Foto: Galli/Malteser", "found": false}, {"type": "without", "string": "Jetzt helfen", "found": false}]}
{"file": "die-partei.net.luebeck.html", "url": "https://die-partei.net/luebeck/2012/05/31/das-ministerium-fur-club-kultur-informiert/", "text_len": 398, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die GEMA dreht v\u00f6llig am Zeiger!", "found": true}, {"type": "with", "string": "http://www.openpetition.de", "found": true}, {"type": "without", "string": "31. Mai", "found": false}, {"type": "without", "string": "Impressum", "found": false}, {"type": "without", "string": "Steuerdarling", "found": false}]}
{"file": "womenshealth.de.weihnachten.html", "url": "https://www.womenshealth.de/abnehmen/weihnachten-nicht-zunehmen/", "text_len": 11442, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Durchschnittlich ein Kilo mehr", "found": true}, {"type": "with", "string": "In der Folge testeten die", "found": true}, {"type": "with", "string": "Normalerweise ist es nicht ratsam", "found": true}, {"type": "without", "string": "Meist gelesen", "found": false}, {"type": "without", "string": "Abnehmen", "found": false}, {"type": "without", "string": "Zur Startseite", "found": false}]}
{"file": "makronom.de-Ressourcenschutzgesetz.html", "url": "https://makronom.de/warum-es-ein-ressourcenschutzgesetz-braucht-45273", "text_len": 9974, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Es besteht ein direkter Zusammenhang", "found": true}, {"type": "with", "string": "zwischen Rohstoffnutzung und Auswirkungen", "found": true}, {"type": "with", "string": "auf den Zustand der Umwelt und \u00d6kosysteme", "found": true}, {"type": "without", "string": "MEHR ZUM THEMA", "found": false}, {"type": "without", "string": "CIRCULAR ECONOMY UND NACHHALTIGE SOZIALE MARKTWIRTSCHAFT", "found": false}, {"type": "without", "string": "Unser kostenloser Newsletter informiert Sie \u00fcber unsere neuesten Beitr\u00e4ge.", "found": false}]}
{"file": "reitschuster.de-Hass-Demo.html", "url": "https://reitschuster.de/post/tagesschau-unterschlaegt-hass-demo-in-essen/", "text_len": 4823, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Auch die Tagesschau-Verantwortlichen drehten bei", "found": true}, {"type": "with", "string": "In der 20 Uhr-Ausgabe vom Sonntagabend pr\u00e4sentierte man", "found": true}, {"type": "with", "string": "doch einen Bericht \u00fcber die Gro\u00dfdemonstration in Essen vom Vorabend", "found": true}, {"type": "without", "string": "Mein Tweet des Tages", "found": false}, {"type": "without", "string": "Meine aktuellen Videos", "found": false}, {"type": "without", "string": "Besuchen Sie unseren Fan-Shop!", "found": false}]}
{"file": "fairkom.eu.about.html", "url": "https://www.fairkom.eu/about", "text_len": 7423, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "ein gemeinwohlorientiertes Partnerschaftsnetzwerk", "found": true}, {"type": "with", "string": "Stimmberechtigung bei der Generalversammlung.", "found": true}, {"type": "without", "string": "Sicher, \u00f6kologisch und fair.", "found": false}, {"type": "without", "string": "Gemeinwohlpunkten", "found": false}]}
{"file": "tofugu.com.dezuka-suisan.html", "url": "https://www.tofugu.com/travel/dezuka-suisan/", "text_len": 4807, "tp": 4, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "We picked out a couple of", "found": true}, {"type": "with", "string": "While they were cooking", "found": true}, {"type": "with", "string": "and everything was tasty.", "found": true}, {"type": "with", "string": "+81 158-23-2012", "found": true}, {"type": "without", "string": "Abashiri Prison Museum", "found": false}, {"type": "without", "string": "885 words", "found": false}, {"type": "without", "string": "View larger map", "found": false}]}
{"file": "neues-deutschland.de.mietenstreik.html", "url": "https://www.neues-deutschland.de/artikel/1136087.mietenstreik-in-den-usa-einfach-kein-geld-mehr-um-die-miete-zu-zahlen.html", "text_len": 10929, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In den Vereinigten Staaten trommeln Aktivisten f\u00fcr einen Mietenstopp in der Coronakrise und warnen Vermieter", "found": true}, {"type": "with", "string": "gigen Mietergewerkschaft Autonomous Tenant Union (ATU) aus Chicago sagt auch", "found": true}, {"type": "with", "string": "wie Oakland oder Seattle und auch in Philadelphia haben Aktivisten", "found": true}, {"type": "without", "string": "Hat Ihnen dieser Artikel gefallen? Dann teilen Sie ihn doch mit anderen", "found": false}, {"type": "without", "string": "ptstadtregion, die sich aus der Verbreitung des Coronavirus ergeben.", "found": false}, {"type": "without", "string": "Fr\u00fcher war mehr Lametta.", "found": false}]}
{"file": "sports.fr.lorient.html", "url": "https://www.sports.fr/direct-foot/50918/177512/lorient-olympique-lyonnais.html", "text_len": 9283, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "termin\u00e9 au Moustoir ! Lorient a tenu", "found": true}, {"type": "with", "string": "Le coup de pied de coin ne donne rien.", "found": true}, {"type": "with", "string": "se cherchent en ce d\u00e9but de match.", "found": true}, {"type": "without", "string": "Ligue des Champions de la CAF", "found": false}, {"type": "without", "string": "Europa League", "found": false}, {"type": "without", "string": "Tous les sports", "found": false}]}
{"file": "ultimasnoticias.com.ve-ucraina.html", "url": "https://ultimasnoticias.com.ve/noticias/mundo/ucrania-interrumpe-paso-de-gas-ruso-a-europa-por-su-territorio/", "text_len": 1860, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "por \u00abcausas de fuerza mayor\u00bb, arguyendo", "found": true}, {"type": "with", "string": "Emmanuel Macron dijo que la entrada", "found": true}, {"type": "with", "string": "ucraniana es muy consciente de ello", "found": true}, {"type": "without", "string": "Deja un comentario", "found": false}, {"type": "without", "string": "causan m\u00e1s hambre en el mundo", "found": false}, {"type": "without", "string": "Ucrania interrumpe paso de gas ruso a Europa por su territorio", "found": false}]}
{"file": "sauvonsluniversite.com.spip.html", "url": "http://www.sauvonsluniversite.fr/spip.php?article8532", "text_len": 6773, "tp": 3, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "L\u2019AG \u00c9ducation \u00cele-de-France inter-degr\u00e9s", "found": true}, {"type": "with", "string": "Gr\u00e8ve et mobilisation pour le climat", "found": true}, {"type": "with", "string": "suivi.reformes.blanquer@gmail.com", "found": true}, {"type": "without", "string": "Sauvons l\u2019Universit\u00e9 !", "found": false}, {"type": "without", "string": "La semaine de SLU", "found": false}]}
{"file": "archive.org.muffinrezept.net.grundrezept.html", "url": "https://web.archive.org/web/20160330101229/http://muffinrezept.net/muffin-grundrezept", "text_len": 1361, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ob Schokost\u00fcckchen, Kokosraspeln, Kakaopulver, Erdbeeren, Kirschen oder anderes Obst", "found": true}, {"type": "with", "string": "bei 180 Grad auf mittlerer Schiene", "found": true}, {"type": "with", "string": "15 \u2013 30 Min", "found": false}, {"type": "without", "string": "Fluffige Himbeermuffins", "found": false}, {"type": "without", "string": "Kommentieren", "found": false}, {"type": "without", "string": "Bildquellen", "found": false}]}
{"file": "dlg.org-Preis.html", "url": "https://www.dlg.org/de/landwirtschaft/presse/aktuell#!/news/dlg-hat-wilhelm-rimpau-preis-ausgeschrieben", "text_len": 323, "tp": 0, "fn": 3, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Auszeichnung f\u00fcr innovative und praxisnahe", "found": false}, {"type": "with", "string": "Fakult\u00e4t deutschsprachiger Universit\u00e4ten", "found": false}, {"type": "with", "string": "n\u00e4chsten DLG-Feldtage, die", "found": false}, {"type": "without", "string": "Fotoarchiv", "found": false}, {"type": "without", "string": "Servicebereich Kommunikation", "found": true}, {"type": "without", "string": "14.72 KB", "found": false}]}
{"file": "standard.co.uk.caribbean.html", "url": "https://www.standard.co.uk/news/uk/turkey-poland-caribbean-islands-added-to-uk-quarantine-list-a4561256.html", "text_len": 4280, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Penalties for those who refuse to self-isolate are", "found": true}, {"type": "with", "string": "Travellers arriving in the UK from those places after", "found": true}, {"type": "with", "string": "to defend what the Government is doing", "found": true}, {"type": "without", "string": "There are no comments yet", "found": false}, {"type": "without", "string": "This is London Magazine", "found": false}, {"type": "without", "string": "Be part of the conversation", "found": false}]}
{"file": "regenbogenportal.de-intersex.html", "url": "https://www.regenbogenportal.de/aktuelles/08112021-online-fachtag-zum-intersex-day-of-remembrance", "text_len": 3388, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "digitale Veranstaltung zum Thema", "found": true}, {"type": "with", "string": "F\u00fcr inter* Personen ist es wichtig", "found": true}, {"type": "with", "string": "Familie, Senioren, Frauen und Jugend", "found": true}, {"type": "without", "string": "Newsletter abonnieren", "found": false}, {"type": "without", "string": "Online-Fachtag zum Intersex", "found": true}, {"type": "without", "string": "Anlaufstellen, Fachveranstaltungen und Materialien", "found": false}]}
{"file": "alexander-klier.net.zeitphilosophie.html", "url": "https://www.alexander-klier.net/zeitenkompetenz/zeitphilosophie/", "text_len": 2867, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Es ist nicht zu wenig Zeit", "found": true}, {"type": "with", "string": "Dieses tiefsitzende Kulturmuster", "found": true}, {"type": "with", "string": "Im Rahmen des Tutzinger", "found": true}, {"type": "without", "string": "Gib Deine E-Mail-Adresse", "found": false}, {"type": "without", "string": "Diese Seite steht grunds\u00e4tzlich", "found": false}, {"type": "without", "string": "Alexander bei MOOCs \u2013 Ein Selbstversuch", "found": false}]}
{"file": "aoc.media.archaisme.html", "url": "https://aoc.media/opinion/2019/12/09/pour-le-neoliberalisme-la-retraite-est-un-archaisme/", "text_len": 1755, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Pour le n\u00e9olib\u00e9ralisme, la retraite", "found": true}, {"type": "with", "string": "les grandes gr\u00e8ves de 1995 furent", "found": true}, {"type": "with", "string": "Pour r\u00e9aliser ce programme, il impose", "found": true}, {"type": "without", "string": "Pour lire la suite", "found": true}, {"type": "without", "string": "Pour acc\u00e9der en illimit\u00e9", "found": true}, {"type": "without", "string": "Pour rester inform\u00e9 inscrivez-vous \u00e0 la newsletter", "found": false}]}
{"file": "mix1.de-clio.html", "url": "https://www.mix1.de/music/leslie-clio/brave-new-woman/", "text_len": 376, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Zuvor hatte die S\u00e4ngerin und Songschreiberin", "found": true}, {"type": "with", "string": "Clio pr\u00e4sentiert das Album", "found": true}, {"type": "with", "string": "bisherigen Karriere geschrieben.", "found": true}, {"type": "without", "string": "amazon Tipp: Nutzen Sie die Musik", "found": false}, {"type": "without", "string": "Tracklist / Infos", "found": false}, {"type": "without", "string": "Sie m\u00f6chten w\u00f6chtliche Produktvorstellungen?", "found": false}]}
{"file": "knowledge-on-air.de.koa039.html", "url": "https://knowledge-on-air.de/2019/12/17/koa039-live-vom-knowledgecamp-2019/", "text_len": 413, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Auch auf dem KnowledgeCamp 2019", "found": true}, {"type": "with", "string": "vom Camp erz\u00e4hlen", "found": true}, {"type": "with", "string": "die \u00fcber ihre Eindr\u00fccke", "found": true}, {"type": "without", "string": "Scholarch der Cogneon", "found": false}, {"type": "without", "string": "Sei der Erste dem dies gef\u00e4llt", "found": false}, {"type": "without", "string": "Dieser Eintrag wurde ver\u00f6ffentlicht", "found": false}]}
{"file": "ad-magazin.de.wellness.html", "url": "https://www.ad-magazin.de/artikel/wellness-hotels", "text_len": 5730, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Diese Wellness-Hotels sind genau richtig", "found": true}, {"type": "with", "string": "Ein Infinity-Pool, ein Onsen-Pool,", "found": true}, {"type": "with", "string": "Zwei Jahre lang restaurierte Elisabeth", "found": true}, {"type": "without", "string": "Ob Chalet, \u00d6ko-Resort oder", "found": false}, {"type": "without", "string": "Tropische Reiseziele:", "found": false}, {"type": "without", "string": "Mehr von AD", "found": false}]}
{"file": "fogsmagazin.com.outdoor.html", "url": "https://fogsmagazin.com/outdoor-bekleidung/", "text_len": 5844, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Egal, ob man ein Outdoor-Fan", "found": true}, {"type": "with", "string": "Dass Outdoor-Bekleidung immer leistungsf\u00e4higer wird", "found": true}, {"type": "with", "string": "Pflegen und Reparieren", "found": true}, {"type": "without", "string": "Schlagworte:", "found": false}, {"type": "without", "string": "Immer mehr Schmucklabels setzen auf faire Produktionsbedingungen", "found": false}, {"type": "without", "string": "Alles \u00fcber nachhaltige Wanderschuhe", "found": true}]}
{"file": "hpd.de-Homosexuellenhass.html", "url": "https://hpd.de/artikel/sie-wissen-nicht-sie-tun-identitaetspolitische-linke-unterschlaegt-den-homosexuellenhass-neuer-21664", "text_len": 11436, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "die traurige Nachricht \u00fcber den Tod des Transmannes Malte C", "found": true}, {"type": "with", "string": "in Folge der Verletzungen nach einem Faustangriff", "found": true}, {"type": "with", "string": "auf der Parade des Christopher Street Days (CSD)", "found": true}, {"type": "without", "string": "Israels \u00dcberlebenskampf gegen den Terror", "found": false}, {"type": "without", "string": "Politischer Islam durch die Hintert\u00fcr", "found": false}, {"type": "without", "string": "Unterdr\u00fcckte (Homo-)Sexualit\u00e4t: Ein Risikofaktor f\u00fcr islamistische Gewalt", "found": true}]}
{"file": "literaturgefluester.wordpress.com.jahr.html", "url": "https://literaturgefluester.wordpress.com/2019/01/01/ins-neue-jahr-4/", "text_len": 7138, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Weihnachten und Silvester habe", "found": true}, {"type": "with", "string": "wahrscheinlich am Mittwoch, wenn", "found": true}, {"type": "with", "string": "in der ersten J\u00e4nnerwoche", "found": true}, {"type": "without", "string": "Einem Blogger gef\u00e4llt dies.", "found": false}, {"type": "without", "string": "Teilen Sie dies mit:", "found": false}, {"type": "without", "string": "This site uses Akismet to reduce spam", "found": false}]}
{"file": "weinlachgummis.blogspot.com.rezi.html", "url": "https://weinlachgummis.blogspot.com/2017/09/rezi-love-is-war-sehnsucht-von-r-k.html", "text_len": 3513, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wir f\u00fchlten uns vereint", "found": true}, {"type": "with", "string": "Aber wieso aus Liebe Krieg", "found": true}, {"type": "with", "string": "Ich habe das Buch regelrecht verschlugen", "found": true}, {"type": "without", "string": "Ich freue mich \u00fcber eure Kommentare", "found": false}, {"type": "without", "string": "Danke f\u00fcr eure Kommentare^^", "found": false}, {"type": "without", "string": "Info zur Bewertung", "found": false}]}
{"file": "greentech.live.energiesparen bei cern.html", "url": "https://www.techfieber.de/green/2022/12/06/energiesparen-bei-cern-teilchenbeschleuniger-macht-winterpause/ ", "text_len": 4885, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Um Strom zu sparen", "found": true}, {"type": "with", "string": "Einschr\u00e4nkung ist \u00abverschmerzbar\u00bb", "found": true}, {"type": "with", "string": "Sparen durch Wartung", "found": true}, {"type": "without", "string": "Greentech.LIVE c/o Innoport RT", "found": false}, {"type": "without", "string": "Name *", "found": false}, {"type": "without", "string": "Kontakt & Impressum", "found": false}]}
{"file": "erneuerbareenergien.de.seeboden.html", "url": "https://www.erneuerbareenergien.de/technologie/offshore-wind/usa-kalifornien-verpachtet-seeboden-zur-entwicklung-von-floating-offshore-windfarmen.", "text_len": 2968, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Bei den siegreichen Bietern", "found": true}, {"type": "with", "string": "Wo die Windfarmentwickler", "found": true}, {"type": "with", "string": "Au\u00dfer in den Vereinigten Staaten", "found": true}, {"type": "without", "string": "Autoren:", "found": false}, {"type": "without", "string": "Tags", "found": false}, {"type": "without", "string": "ANMELDUNG UND REGISTRIERUNG", "found": false}]}
{"file": "chemie.de.spin-off.html", "url": "https://www.chemie.de/news/1178836/empa-spin-off-revolutioniert-die-messung-von-treibhausgasen-und-luftschadstoffen.html", "text_len": 4944, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Das im Februar 2018 als Spin-off der Empa ", "found": true}, {"type": "with", "string": "Die von Hundt und Aseev", "found": true}, {"type": "with", "string": "Und im Oktober verlieh Innosuisse", "found": true}, {"type": "without", "string": "Fakten, Hintergr\u00fcnde, Dossiers", "found": false}, {"type": "without", "string": "Start-ups", "found": true}, {"type": "without", "string": "Empa (Eidgen\u00f6ssische Materialpr\u00fcfungs- und Forschungsanstalt)", "found": false}]}
{"file": "andreabottlinger.wordpress.com.arent.html", "url": "https://andreabottlinger.wordpress.com/2019/12/26/arent-we-all/", "text_len": 1422, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Es wird Zeit, dass ich", "found": true}, {"type": "with", "string": "Und damit m\u00f6chte ich auch", "found": true}, {"type": "with", "string": "Mitstreiter Bug gebastelt", "found": true}, {"type": "without", "string": "Um neue Beitr\u00e4ge per E-Mail", "found": false}, {"type": "without", "string": "Einem Blogger gef\u00e4llt dies", "found": false}, {"type": "without", "string": "Twitter hat nicht geantwortet", "found": false}]}
{"file": "financescout24.de.autokredit.html", "url": "https://www.financescout24.de/kredit/autokredit", "text_len": 27813, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Diese bringt weitere Kosten mit sich.", "found": true}, {"type": "with", "string": "hat der Finanzierer gr\u00f6\u00dfere Chancen auf eine Verg\u00fctung ohne Abschl\u00e4ge", "found": true}, {"type": "with", "string": "Wieso sind Autobank-Kredite trotz niedriger Zinsen oft teurer?", "found": true}, {"type": "without", "string": "Die Nr. 1 rund um Immobilien", "found": false}, {"type": "without", "string": "\u00a9 Copyright 2000", "found": false}, {"type": "without", "string": "Aktuelle News", "found": false}]}
{"file": "blog.amp.dev.axios.html", "url": "https://blog.amp.dev/2020/04/07/people-behind-the-code-the-axios-ascent/", "text_len": 4251, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "shift to AMP-first. We invited the duo for a chat to discover how a beta test in 2019 escalated", "found": true}, {"type": "with", "string": "Were there any challenges you had to overcome?", "found": true}, {"type": "with", "string": "color in your pencil case, you start drawing a lot quicker instead of worrying about shades", "found": true}, {"type": "without", "string": "Your email address will not be published.", "found": false}, {"type": "without", "string": "iscussions, and advanced tutorials straight to your inbox with the AMP newsletter.", "found": false}, {"type": "without", "string": "All rights reserved. The OpenJS Foundation", "found": false}]}
{"file": "nationalrail.co.uk.disruptions.html", "url": "https://www.nationalrail.co.uk/service_disruptions/245738.aspx", "text_len": 51139, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Customers with disabilities will be asked about the best", "found": true}, {"type": "with", "string": "only on longer journeys over 60 minutes", "found": true}, {"type": "with", "string": "LNER are able to carry foldable wheelchairs as", "found": true}, {"type": "without", "string": "About this site", "found": false}, {"type": "without", "string": "Rail Replacement", "found": true}, {"type": "without", "string": "You are here", "found": false}]}
{"file": "sportnews.bz-peking.html", "url": "https://www.sportnews.bz/artikel/wintersport/wintersport-mix/peking-sucht-den-superstar-7-moegliche-gesichter", "text_len": 5253, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "bereits zur j\u00fcngsten Slalom-Olympiasiegerin", "found": true}, {"type": "with", "string": "Gu gilt als Mustersch\u00fclerin, sie ist Stanford", "found": true}, {"type": "with", "string": "bisher allerdings nicht optimal gelaufen", "found": true}, {"type": "without", "string": "AFP / MARCO BERTORELLO", "found": true}, {"type": "without", "string": "So viel verdienen Lkw-Fahrer in Berlin", "found": false}, {"type": "without", "string": "Tausende Hausbesitzer", "found": false}]}
{"file": "offshore-stiftung.de.offshore-windenergie.html", "url": "https://www.offshore-stiftung.de/offshore-windenergie", "text_len": 10670, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Windparks in Nord- und Ostsee", "found": true}, {"type": "with", "string": "EXTREME BEDINGUNGEN AUF SEE", "found": false}, {"type": "with", "string": "OFFSHORE-WINDENERGIE ALS BUNDESWEITER JOBMOTOR", "found": false}, {"type": "without", "string": "VERANSTALTUNGEN", "found": false}, {"type": "without", "string": "PROJEKTE", "found": false}, {"type": "without", "string": "BLEIBEN SIE INFORMIERT", "found": false}]}
{"file": "wsvn.com-crash.html", "url": "https://wsvn.com/news/local/miami-dade/15-year-old-driver-killed-14-year-old-passenger-critical-in-sw-miami-dade-crash/", "text_len": 2475, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Investigators said a patrol unit turned on its lights", "found": false}, {"type": "with", "string": "with plans to attempt a traffic stop in the area of Southwest 118th Avenue.", "found": true}, {"type": "with", "string": "the driver lost control of the vehicle", "found": true}, {"type": "without", "string": "Join our Newsletter", "found": false}, {"type": "without", "string": "for the latest news right to your inbox", "found": false}, {"type": "without", "string": "CHILDRENS PROGRAMMING", "found": false}]}
{"file": "vegolosi.it.climate.html", "url": "https://www.vegolosi.it/news/climate-clock/", "text_len": 2999, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ce lo ripetono continuamente gli esperti che", "found": true}, {"type": "with", "string": "Ma se la nostra specie vuole sopravvivere", "found": true}, {"type": "with", "string": "A New York il Metronome si trasforma in un", "found": true}, {"type": "without", "string": "Per saperne di pi\u00f9", "found": false}, {"type": "without", "string": "Guide di base", "found": false}, {"type": "without", "string": "Frutta e verdura di stagione", "found": false}]}
{"file": "viconsortium.com-cocaine.html", "url": "https://viconsortium.com/vi-crime/virgin-islands-vessel-returning-to-puerto-rico-from-st-thomas-with-475-pounds-of-cocaine-intercepted-by-federal-agents-cbp-says", "text_len": 2119, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "U.S. Customs and Border Protection", "found": true}, {"type": "with", "string": "AMO agents requested assistance from a Puerto", "found": true}, {"type": "with", "string": "awareness in the air and maritime environments,\u201d", "found": true}, {"type": "without", "string": "phone with the VI Consortium app.", "found": false}, {"type": "without", "string": "AMO found Sunday 475 pounds of cocaine", "found": true}, {"type": "without", "string": "By U.S. CUSTOMS AND BORDER PROTECTION", "found": true}]}
{"file": "nextkabinett.wordpress.com.garden.html", "url": "https://nextkabinett.wordpress.com/2014/01/17/derek-jarman-%c2%b7-the-garden/", "text_len": 666, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "The Garden \u00b7 Derek Jarman (1990)", "found": true}, {"type": "with", "string": "A nearly wordless visual narrative", "found": true}, {"type": "with", "string": "Loose in this contemporary world", "found": true}, {"type": "without", "string": "B\u00fcro der Social Secretary", "found": false}, {"type": "without", "string": "Kommentar verfassen", "found": false}, {"type": "without", "string": "@EwigeSommerzeit Danke f\u00fcr den Link", "found": false}]}
{"file": "juliasleseblog.blogspot.com.irland.html", "url": "https://juliasleseblog.blogspot.com/2018/08/irland-roadtrip.html", "text_len": 0, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "meine zweite gro\u00dfe Leidenschaft", "found": false}, {"type": "with", "string": "findet ihr darin sogar", "found": false}, {"type": "with", "string": "bei Fragen helfe ich gerne", "found": false}, {"type": "without", "string": "Gepostet vor", "found": false}, {"type": "without", "string": "Kommentar schreiben als", "found": false}, {"type": "without", "string": "Julias Lesewelt ", "found": false}]}
{"file": "ok-magazin.de.einbetoniert.html", "url": "https://www.ok-magazin.de/people/real-life/horror-fund-instagram-star-24-einbetoniert-62276.html", "text_len": 1469, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Ermittler gehen davon aus, dass der drogens\u00fcchtige Mann", "found": true}, {"type": "with", "string": "das alles w\u00e4re nur ein Traum, es tut mir so leid.", "found": true}, {"type": "with", "string": "Kaum zu fassen, dass diese Story wirklich passiert ist:", "found": true}, {"type": "without", "string": "TikTok-Star begeht", "found": false}, {"type": "without", "string": "Real Life", "found": false}, {"type": "without", "string": "Themen", "found": false}]}
{"file": "drk.de-Glasgow.html", "url": "https://www.drk.de/presse/pressemitteilungen/meldung/drk-immer-mehr-menschen-wegen-klimawandel-auf-hilfe-angewiesen/", "text_len": 2931, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": " Hitzewellen ausgesetzt gewesen", "found": true}, {"type": "with", "string": "Zudem betreibt das DRK", "found": true}, {"type": "with", "string": "Klimawandel als globale Bedrohung", "found": true}, {"type": "without", "string": "Jede kleine Spende", "found": false}, {"type": "without", "string": "Beitrag teilen", "found": false}, {"type": "without", "string": "Diese Seite:", "found": false}]}
{"file": "dhz-online.de-bewegung.html", "url": "https://www.dhz-online.de/de/news/detail/artikel/schwangere-zu-mehr-bewegung-motivieren/", "text_len": 2798, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "schlussfolgern aus ihren Daten, dass k\u00f6rperliche", "found": true}, {"type": "with", "string": "Schwangerschaft sollte gesch\u00e4rft werden.", "found": true}, {"type": "with", "string": "durchgef\u00fchrt wurden waren Bummeln", "found": true}, {"type": "without", "string": "Weitere Meldungen aus", "found": false}, {"type": "without", "string": "Alle Meldungen der Rubrik", "found": false}, {"type": "without", "string": "Sylter Hebammen-Notruf wieder erreichbar", "found": false}]}
{"file": "galore.de.buch.html", "url": "https://www.galore.de/kultur/artikel/30-11-buch-der-woche-nikole-hannah-jones-hrsg-o-1619", "text_len": 1283, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Was als Sonderausgabe der", "found": true}, {"type": "with", "string": "Die fundierten wie komplexen", "found": true}, {"type": "with", "string": "Nikole Hannah-Jones (Hrsg.)", "found": true}, {"type": "without", "string": "Abo", "found": false}, {"type": "without", "string": "Facebook", "found": false}, {"type": "without", "string": "Interviews", "found": false}]}
{"file": "d51e75d9e53a472bb7708191899aa6b4.html", "url": "https://www.ln-online.de/Lokales/Luebeck/Luebeck-So-war-die-Auktion-fuer-St.-Johannes-in-Kuecknitz", "text_len": 2456, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "wurden Dachboden-Sch\u00e4tze der Kirche St. Johannes versteigert", "found": false}, {"type": "with", "string": "Kirchenvorsteher Niels S\u00f6nnichsen hat alle Sch\u00e4tze", "found": true}, {"type": "with", "string": "Gem\u00e4lde werden hoch gehandelt", "found": true}, {"type": "without", "string": "Newsletter abonnieren", "found": false}, {"type": "without", "string": "Die Kultkneipe schlie\u00dft: Jutta's Eck", "found": false}, {"type": "without", "string": "Weitere LN+ Artikel", "found": false}]}
{"file": "jolie.de.adele.html", "url": "https://www.jolie.de/stars/adele-10-kilo-abgenommen-sie-zeigt-sich-schlanker-denn-je-200226.html", "text_len": 1354, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Adele feierte ausgelassen mit den Spice Girls", "found": true}, {"type": "with", "string": "wie sich Adele weiterentwickelt.", "found": true}, {"type": "without", "string": "Sommerzeit ist Urlaubszeit,", "found": false}, {"type": "without", "string": "Lade weitere Inhalte", "found": false}]}
{"file": "regards.fr.enquetes.html", "url": "http://www.regards.fr/politique/article/deux-ans-et-demi-en-macronie-9-mises-en-examen-10-enquetes-en-cours-et-2", "text_len": 15341, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "seule promesse du candidat Macron, la", "found": true}, {"type": "with", "string": "Le 6 ao\u00fbt 2019, le d\u00e9put\u00e9", "found": true}, {"type": "with", "string": "Anticor a port\u00e9 plainte pour", "found": true}, {"type": "without", "string": "Qui \u00eates-vous ?", "found": false}, {"type": "without", "string": "Pour cr\u00e9er des paragraphes, laissez simplement des lignes vides.", "found": false}, {"type": "without", "string": "Vos r\u00e9actions", "found": false}]}
{"file": "diy-expeditions.com.uebersee.html", "url": "http://diy-expeditions.com/expeditionen-planen/expeditionen-in-uebersee/", "text_len": 1054, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wir gehen gerne mit Ihnen Ihr Expeditionskonzept durch.", "found": true}, {"type": "with", "string": "Falls Sie sich f\u00fcr ein vorgeschlagenes Reise-Paket der auf unserer News-Seite vertretenen Tour-Veranstalter entscheiden", "found": true}, {"type": "with", "string": "Sie bezahlen Ihren Guide, Transport, Unterkunft etc. vor Ort und direkt bei Ihrem von uns vermittelten Kontakt.", "found": true}, {"type": "without", "string": "Fahrzeug samt Fahrer", "found": false}, {"type": "without", "string": "Neuigkeiten aus unseren Destinationen", "found": false}, {"type": "without", "string": "y-expeditions.com. All rights reserved", "found": false}]}
{"file": "politico.com.retirement.html", "url": "https://www.politico.com/news/2019/12/30/mark-meadows-retirement-elect-wife-friend-090838", "text_len": 7478, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "shock retirement \u2014 revealed just 30 hours before the", "found": true}, {"type": "with", "string": "though he faces another stiff primary challenge next year.", "found": true}, {"type": "with", "string": "\u201cI don\u2019t expect anyone to hand me anything.", "found": true}, {"type": "without", "string": "Credit Card Payments", "found": false}, {"type": "without", "string": "Notice to California Residents", "found": false}, {"type": "without", "string": "Terms of Service", "found": false}]}
{"file": "baumev.de.Transformationslabor.html", "url": "https://www.baumev.de/News/10365/TransformationslaborErnhrung.html", "text_len": 1460, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Die Ern\u00e4hrungswirtschaft birgt", "found": true}, {"type": "with", "string": "Ausschlaggebend f\u00fcr die Initiative", "found": true}, {"type": "with", "string": "Im Fokus des Projekts steht die Frage", "found": true}, {"type": "without", "string": "Kontakt:", "found": false}, {"type": "without", "string": "Ansprechpartnerin zum", "found": true}, {"type": "without", "string": "KLIMANEUTRALIT\u00c4T VON UNTERNEHMEN", "found": true}]}
{"file": "springer.com-produkte.html", "url": "https://www.springer.com/de/acht-produkte-mit-sustainable-award-in-finance-praemiert/19837156", "text_len": 4822, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Corona-Verordnung des Landes Hessen statt.", "found": true}, {"type": "with", "string": "AG sowie die Berlin Hyp", "found": true}, {"type": "with", "string": "Wiesbaden werden Fachzeitschriften,", "found": true}, {"type": "without", "string": "Kontakt", "found": false}, {"type": "without", "string": "Logo des Sustainable Award in Finance", "found": false}, {"type": "without", "string": "Rechtliches", "found": false}]}
{"file": "hackernoon.com.scrape.html", "url": "https://hackernoon.com/how-to-scrape-google-with-python-bo7d2tal", "text_len": 2688, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "There are also some caveats", "found": true}, {"type": "with", "string": "Ever since Google Web", "found": true}, {"type": "with", "string": "Making the request is", "found": true}, {"type": "without", "string": "Hackernoon Newsletter curates", "found": false}, {"type": "without", "string": "Comments", "found": false}, {"type": "without", "string": "Creating Search Engine API", "found": false}]}
{"file": "nytimes.com.blackouts.html", "url": "https://www.nytimes.com/2020/08/16/business/california-blackouts.html", "text_len": 5231, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "As temperatures began to rise in California on", "found": true}, {"type": "with", "string": "\u201cIf there\u2019s really a problem and not just the ISO", "found": true}, {"type": "with", "string": "In particular, California ISO said two natural gas power", "found": true}, {"type": "without", "string": "Her Husband Abused Her. But Getting a Divorce Was", "found": false}, {"type": "without", "string": "Chris Rock Tried to Warn Us", "found": false}, {"type": "without", "string": "Opinion: Which Party Represents the Racial Future?", "found": false}]}
{"file": "autonews.ch-Tesla.html", "url": "https://www.autonews.ch/?p=31228", "text_len": 919, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "wieder Ger\u00fcchte zu Tesla", "found": true}, {"type": "with", "string": "Gunsten von Qingdao", "found": true}, {"type": "with", "string": "aber sicher eine vierte Gigafactory", "found": true}, {"type": "without", "string": "Volltext-Suche:", "found": false}, {"type": "without", "string": "Fahrbericht Ioniq 5 von Hyundai", "found": false}, {"type": "without", "string": "Crossback \u2013 charmant und mit", "found": false}]}
{"file": "cnet.de.schutz.html", "url": "https://www.cnet.de/88130484/so-koennen-internet-user-nach-dem-eugh-urteil-fuer-den-schutz-sensibler-daten-sorgen", "text_len": 3553, "tp": 2, "fn": 1, "fp": 1, "tn": 4, "details": [{"type": "with", "string": "liefert eine Einsch\u00e4tzung", "found": false}, {"type": "with", "string": "Auch der Verweis auf ehrverletzende Bewertungen", "found": true}, {"type": "with", "string": "Am 13. Mai 2014", "found": true}, {"type": "without", "string": "Anja Schmoll-Trautmann", "found": false}, {"type": "without", "string": "Fanden Sie diesen Artikel n\u00fctzlich?", "found": false}, {"type": "without", "string": "Aktuell", "found": false}, {"type": "without", "string": "Kommentar hinzuf\u00fcgen", "found": false}, {"type": "without", "string": "Zu seinen T\u00e4tigkeitsfeldern z\u00e4hlen", "found": true}]}
{"file": "de.globalvoices.org.nicaragua.html", "url": "https://de.globalvoices.org/2019/04/30/ein-jahr-voller-proteste-nicaraguaner-wollen-nicht-mehr-nur-den-rucktritt-ortegas-sondern-einen-neuanfang/", "text_len": 9724, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Seit dem Ausbruch der Massenproteste gegen", "found": true}, {"type": "with", "string": "Laut der niedrigsten Sch\u00e4tzung", "found": true}, {"type": "with", "string": "Ich sah, wie eine Freundin von der Universit\u00e4t", "found": true}, {"type": "without", "string": "@globalvoices verdient einen Preis f\u00fcr die", "found": false}, {"type": "without", "string": "Italiano", "found": false}, {"type": "without", "string": "Name (Pflichtfeld)", "found": false}]}
{"file": "ext.theperspective.com.items.html", "url": "https://ext.theperspective.com/items-we-never-knew-we-wanted/1/", "text_len": 20006, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "dawn of the internet brought about a lot", "found": true}, {"type": "with", "string": "to turn any laundry day into a blast", "found": true}, {"type": "with", "string": "This item is perfect for those of", "found": true}, {"type": "without", "string": "All Rights Reserved", "found": false}, {"type": "without", "string": "The Perspective Challenge", "found": false}, {"type": "without", "string": "DMCA", "found": false}]}
{"file": "forstpraxis.de.palletsauslaub.html", "url": "https://www.forstpraxis.de/pilotprojekt-heizen-mit-pellets-aus-laub-so-funktioniert-es-21677", "text_len": 2169, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In Reichenbach in der Lausitz", "found": false}, {"type": "with", "string": "Ein Antrag f\u00fcr F\u00f6rdermittel ist gestellt", "found": true}, {"type": "with", "string": "\u201eMan kann diese Pellets genauso", "found": true}, {"type": "without", "string": "AUCH INTERESSANT", "found": false}, {"type": "without", "string": "FORST&TECHNIK", "found": false}, {"type": "without", "string": "KLEINANZEIGEN", "found": false}]}
{"file": "refinery29.com.single.html", "url": "https://www.refinery29.com/de-de/single-weihnachten-fragen", "text_len": 4724, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "\u201eMeine letzte ernste Beziehung ging ", "found": true}, {"type": "with", "string": "Wenn dir Leute Fragen zum Dating", "found": true}, {"type": "with", "string": "W\u00e4hrend der Feiertage gibt es zahlreiche", "found": true}, {"type": "without", "string": "Lust auf mehr?", "found": true}, {"type": "without", "string": "The Conversation", "found": false}, {"type": "without", "string": "More from Relationships", "found": false}]}
{"file": "spreeblick.com.habeck.html", "url": "http://www.spreeblick.com/blog/2006/07/29/aus-aus-alles-vorbei-habeck-macht-die-stahnke/", "text_len": 1576, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Hunderttausende von jungen Paaren", "found": true}, {"type": "with", "string": "wie flatterhaft das M\u00e4dl ist? :)", "found": true}, {"type": "without", "string": "Malte Welding", "found": false}, {"type": "without", "string": "YouTube und die Alten", "found": false}, {"type": "without", "string": "Autokorrektur", "found": false}]}
{"file": "sheego.de.cleaning.html", "url": "https://www.sheego.de/magazin/coole-tipps/magic-cleaning/", "text_len": 16476, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Sie ist die K\u00f6nigin des Aufr\u00e4umens", "found": true}, {"type": "with", "string": "sie kommen ganz zum Schluss", "found": true}, {"type": "with", "string": "Was gibt mir ein gutes Gef\u00fchl", "found": true}, {"type": "without", "string": "15 %* Newsletter Gutschein", "found": false}, {"type": "without", "string": "Ich bin damit einverstanden", "found": false}, {"type": "without", "string": "Coole Tipps|Magic Cleaning", "found": false}]}
{"file": "uk.trustpilot.com.reviews.html", "url": "https://uk.trustpilot.com/reviews/581cf1892ae760087cadbf17", "text_len": 549, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Gousto has changed my life", "found": true}, {"type": "with", "string": "What a fantastic idea!", "found": true}, {"type": "without", "string": "4 Nov 2016", "found": false}, {"type": "without", "string": "Useful", "found": false}, {"type": "without", "string": "reviews", "found": false}]}
{"file": "realsimple.com.hydrangea.html", "url": "https://www.realsimple.com/home-organizing/gardening/outdoor/hydrangea-care", "text_len": 8806, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Hydrangeas may be just about everywhere", "found": true}, {"type": "with", "string": "Make sure that the bottom of your container has holes", "found": true}, {"type": "with", "string": "1. Choose the Right Pot", "found": true}, {"type": "without", "string": "choosing your hydrangeas at the store, look for", "found": true}, {"type": "without", "string": "Fall is the time of year when root", "found": false}, {"type": "without", "string": "Sarah Yang", "found": false}]}
{"file": "zamg.ac.at-Jahresbericht.html", "url": "https://www.zamg.ac.at/cms/de/klima/news/histalp/histalp-oesterreich-jahresbericht-2021", "text_len": 995, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "zur\u00fcckreichen und besonderen", "found": true}, {"type": "with", "string": "Messwerte der Gegenwart mit", "found": true}, {"type": "with", "string": "nternationale Klimadatensammlung", "found": true}, {"type": "without", "string": "Die ZAMG ist eine", "found": false}, {"type": "without", "string": "Auskunft \u00fcber vergangenes", "found": false}, {"type": "without", "string": "Berechnung der erwartbaren", "found": false}]}
{"file": "groove.de-Anti-A100-Aktivist.html", "url": "https://groove.de/2023/10/31/anti-a100-aktivist-tobias-trommer-es-wird-an-der-zeit-dass-die-clubs-verantwortung-nehmen/", "text_len": 6956, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Treffpunkt ist Berlin-Friedrichshain", "found": true}, {"type": "with", "string": "direkt vor der Renate", "found": true}, {"type": "with", "string": "einem der f\u00fcnf Clubs, die vom Bau der A100 gef\u00e4hrdet sind", "found": true}, {"type": "without", "string": "TikTok-Techno 2.0: Ist die Blase geplatzt?", "found": false}, {"type": "without", "string": "Das Ph\u00e4nomen Stella Bossi: Ein nebul\u00f6ser Sehnsuchtsort, massentauglich gemacht", "found": false}, {"type": "without", "string": "Die Konkurrenz ist gnadenlos hart geworden", "found": false}]}
{"file": "apolut.net-Sonja-Silberhorn.html", "url": "https://apolut.net/interview-mit-schriftstellerin-sonja-silberhorn/", "text_len": 13332, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die deutsche Autorin Sonja Silberhorn", "found": true}, {"type": "with", "string": "hat die Corona-Krise und ihre gesellschaftlichen Folgen in einem Kriminalroman verarbeitet", "found": true}, {"type": "with", "string": "Den legte sie einem mittelgro\u00dfen", "found": true}, {"type": "without", "string": "Auch interessant...", "found": false}, {"type": "without", "string": "Leuchtturm ARD ORF SRG \u2013 Initiative zur Beitragsbefreiung", "found": false}, {"type": "without", "string": "Mein Leben als Monster", "found": false}]}
{"file": "beyssonmanagement.com.innovation.html", "url": "https://beyssonmanagement.com/2014/07/15/was-ist-innovation/", "text_len": 2191, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Am 14. Juni 2005 hielt Steve Jobs", "found": true}, {"type": "with", "string": "David Brier, international anerkannter", "found": true}, {"type": "with", "string": "Ein hilfreicher kleiner Film", "found": true}, {"type": "without", "string": "Bitte geben Sie Ihre E-Mail-Adresse ein", "found": false}, {"type": "without", "string": "Dieser Eintrag wurde ver\u00f6ffentlicht in", "found": false}, {"type": "without", "string": "Kommentar verfassen", "found": false}]}
{"file": "bundespraesident.de.20030331.html", "url": "https://www.bundespraesident.de/SharedDocs/Reden/DE/Johannes-Rau/Reden/2003/03/20030331_Rede2.html", "text_len": 31730, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "m Juni 1948 unternahm ein Berater des amerikanischen Milit\u00e4rgouverneurs Clay eine Rundreise durc", "found": true}, {"type": "with", "string": " vielleicht am sch\u00f6nsten mit einem Kirchenlied des Grafen Zinzendorf sagen:", "found": true}, {"type": "with", "string": "994 errechnet, dass nur sechzehn von 120 Gesetzgebungsvorhaben gestaltende ", "found": true}, {"type": "without", "string": "Diese Seite", "found": false}, {"type": "without", "string": "\u00a9 2020 Bundespr\u00e4sidialamt", "found": false}, {"type": "without", "string": "Lebenslauf", "found": false}]}
{"file": "_Ziemniaki na sz\u00f3stej, sur\u00f3wka na dziesi\u0105tej_. Jak pomaga\u0107, \u017ceby nie zaszkodzi\u0107_ [PORADNIK W PIGU\u0141CE].html", "url": "https://wiadomosci.gazeta.pl/wiadomosci/7,114883,27025667,ziemniaki-na-szostej-surowka-na-dziesiatej-jak-pomoc-zeby.html#s=BoxMMt2", "text_len": 4219, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "pom\u00f3c osobie niewidomej", "found": true}, {"type": "with", "string": "Osoby niewidome, s\u0142abowidz\u0105ce:", "found": true}, {"type": "with", "string": "mo\u017ce wypa\u015b\u0107 z w\u00f3zka.", "found": true}, {"type": "without", "string": "Agencja Gazeta", "found": true}, {"type": "without", "string": "cocopanda.pl", "found": false}, {"type": "without", "string": "Komentarze", "found": false}]}
{"file": "bauemotion.de-schneereampflicht.html", "url": "https://www.bauemotion.de/magazin/schneeraeumpflicht-das-sollten-sie-wissen/15002914/", "text_len": 2885, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Hausbesitzer sind gesetzlich dazu", "found": true}, {"type": "with", "string": "Wenn sich ein Passant auf einem", "found": true}, {"type": "with", "string": "Fitnesstraining an der frischen Luft.", "found": true}, {"type": "without", "string": "Meist gelesene Artikel", "found": false}, {"type": "without", "string": "Schneer\u00e4umpflicht - was man dar\u00fcber", "found": false}, {"type": "without", "string": "Dieser Artikel wird Ihnen pr\u00e4sentiert", "found": false}]}
{"file": "adac.de.kindersitze.html", "url": "https://www.adac.de/rund-ums-fahrzeug/tests/kindersicherheit/kindersitztest-2018/", "text_len": 4320, "tp": 5, "fn": 0, "fp": 1, "tn": 3, "details": [{"type": "with", "string": "in punkto Sicherheit, Bedienung, Ergonomie", "found": true}, {"type": "with", "string": "Elf Modelle sind empfehlenswert", "found": true}, {"type": "with", "string": "Jan\u00e9 Koos i-Size", "found": true}, {"type": "with", "string": "Grenzwert der Richtlinie 2014/79/EU", "found": true}, {"type": "with", "string": "Besonders bei Babyschalen sollte gepr\u00fcft werden", "found": true}, {"type": "without", "string": "23.10.2018", "found": true}, {"type": "without", "string": "Rund ums Fahrzeug", "found": false}, {"type": "without", "string": "Diesel-Umtauschpr\u00e4mien", "found": false}, {"type": "without", "string": "Dieses Video wird \u00fcber YouTube", "found": false}]}
{"file": "changelog.blog.zwischenbilanz.html", "url": "https://www.changelog.blog/zwischenbilanz-jan-kegelberg-ueber-tops-und-flops-bei-der-transformation-von-sportscheck/", "text_len": 6172, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Gibt es weitere Top-Ma\u00dfnahmen f\u00fcr Multi-Channel?", "found": true}, {"type": "with", "string": "Vielen Dank f\u00fcr das interessante Interview!", "found": true}, {"type": "without", "string": "Annette Henkel", "found": false}, {"type": "without", "string": "akzeptiere die Datenschutzbestimmungen", "found": false}, {"type": "without", "string": "Diese Beitr\u00e4ge solltest du nicht verpassen", "found": false}]}
{"file": "smava.de.privatkredit.html", "url": "https://www.smava.de/privatkredit/privatkredit-zinsen/", "text_len": 1335, "tp": 1, "fn": 5, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "und wie die Berechnung Ihrer Privatkredit-Zinsen erfolgt, erfahren Sie hier.", "found": false}, {"type": "with", "string": "286,35 \u20ac", "found": true}, {"type": "with", "string": "ein unbefristetes Arbeitsverh\u00e4ltnis sowie Verm\u00f6genswerte bzw. Sicherheiten", "found": false}, {"type": "with", "string": "\u00c4nderung der Zinsh\u00f6he bei Privatkrediten", "found": false}, {"type": "with", "string": "Wie wird die H\u00f6he der f\u00e4lligen Zinsen f\u00fcr meinen Privatkredit bestimmt?", "found": false}, {"type": "with", "string": "Gilt die vereinbarte Zinsbindung f\u00fcr die gesamte Kreditlaufzeit,", "found": false}, {"type": "without", "string": "Erhalten Sie kostenlos aktuelle Kredit-News und Informationen zu Sonderzins-Aktionen", "found": false}, {"type": "without", "string": "Kostenlose Beratung", "found": false}, {"type": "without", "string": "zum Kreditvergleich", "found": false}]}
{"file": "schleifen.ucoz.de.briefe.html", "url": "http://schleifen.ucoz.de/blog/briefe/2010-10-26-18", "text_len": 563, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Es war gesagt,", "found": true}, {"type": "with", "string": "Jedes M\u00e4dchen tr\u00e4umt von Justin", "found": true}, {"type": "with", "string": "Symbol auf dem Finger haben", "found": true}, {"type": "without", "string": "3:59 PM", "found": false}, {"type": "without", "string": "Aufrufe:", "found": false}, {"type": "without", "string": "Kommentare insgesamt:", "found": false}]}
{"file": "rnz.de.witzel.html", "url": "https://www.rnz.de/nachrichten_artikel,-zz-dpa-Schlaglichter-Frank-Witzel-erhaelt-Deutschen-Buchpreis-2015-_arid,133484.html", "text_len": 603, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "F\u00fcr einen Roman", "found": true}, {"type": "with", "string": "Auszeichnung der Branche.", "found": true}, {"type": "without", "string": "Ihre RNZ.", "found": false}, {"type": "without", "string": "WHATSAPP", "found": false}]}
{"file": "vergleich.de.leasen.html", "url": "https://www.vergleich.de/auto-leasen-finanzieren-oder-kaufen.html", "text_len": 13716, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "welche Vor- und Nachteile es dabei gibt.", "found": true}, {"type": "with", "string": "Vorteile bei der Finanzierung \u00fcber einen Autokredit:", "found": true}, {"type": "with", "string": "Kratzer und Beulen kommen Sie teuer zu stehen.", "found": true}, {"type": "without", "string": "Zahnzusatzversicherung Vergleich", "found": false}, {"type": "without", "string": "So hoch sind die Kreditzinsen 2020", "found": false}, {"type": "without", "string": "K\u00f6nnen wir helfen?", "found": false}]}
{"file": "flowfx.de.tmux.html", "url": "https://flowfx.de/blog/copy-paste-from-tmux-to-system-clipboard/", "text_len": 510, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "or the first time in many years", "found": true}, {"type": "with", "string": "As usual, StackOverflow", "found": true}, {"type": "with", "string": "set-option -s set", "found": true}, {"type": "without", "string": "Next post", "found": false}, {"type": "without", "string": "All content is licensed", "found": false}, {"type": "without", "string": "Powered by Nikola", "found": false}]}
{"file": "papaganda.org.minions.html", "url": "http://papaganda.org/2016/04/02/minions-mit-schablonen-malen-mit-malerrolle-und-bunten-farben/", "text_len": 4751, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wochenende. Regen. Mist.", "found": true}, {"type": "with", "string": "Im Baumarkt des Misstrauens", "found": true}, {"type": "with", "string": "Papa, geh mal auf Google", "found": true}, {"type": "without", "string": "Das Internet behauptet", "found": false}, {"type": "without", "string": "2 Kommentare", "found": false}, {"type": "without", "string": "Zu faul zu tippen?", "found": false}]}
{"file": "kas.de-nordmazedonien.html", "url": "https://www.kas.de/de/laenderberichte/detail/-/content/kommunalwahlen-in-nordmazedonien", "text_len": 20397, "tp": 2, "fn": 1, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Die Lokalwahlen endeten", "found": false}, {"type": "with", "string": "Der Hauptstadt Skopje wird", "found": true}, {"type": "with", "string": "Zaev erkl\u00e4rt seinen R\u00fccktritt", "found": true}, {"type": "without", "string": "\u00dcber diese Reihe", "found": true}, {"type": "without", "string": "Die Auslandsmitarbeiter vor Ort", "found": true}, {"type": "without", "string": "Erdrutschsieg der", "found": false}]}
{"file": "finanzmarktwelt.de-Benko-Firma.html", "url": "https://finanzmarktwelt.de/signa-rene-benko-daten-berater-289554/", "text_len": 2802, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In Hamburg kommt man aktuell", "found": true}, {"type": "with", "string": "kaum an dem Thema vorbei", "found": true}, {"type": "with", "string": "Bei mehreren Prestigeprojekten", "found": true}, {"type": "without", "string": "Dax und Gold: Szenarien f\u00fcr heutiges Fed Mega-Event", "found": false}, {"type": "without", "string": "LESEN SIE AUCH", "found": false}, {"type": "without", "string": "HINTERLASSEN SIE EINE ANTWORT", "found": false}]}
{"file": "netbits.us.stunnel_rsync.html", "url": "http://www.netbits.us/docs/stunnel_rsync.html", "text_len": 25615, "tp": 3, "fn": 0, "fp": 1, "tn": 0, "details": [{"type": "with", "string": "documentation examples rely heavily on tcp-wrappers and Stunnel", "found": true}, {"type": "with", "string": "cd to the directory containing the tarball", "found": true}, {"type": "with", "string": "cert = /etc/stunnel/langly_stunnel_cert.pem", "found": true}, {"type": "without", "string": "Last Modified:", "found": true}]}
{"file": "business-punk.com.fitness.html", "url": "https://www.business-punk.com/2022/12/netflix-and-dont-chill-netflix-nimmt-fitness-reihe-ins-programm-auf/", "text_len": 0, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Insgesamt werde es \u00fcber 30", "found": false}, {"type": "with", "string": "In der ersten Staffel", "found": false}, {"type": "with", "string": "Die Kollaboration ist", "found": false}, {"type": "without", "string": "BUSINESS PUNK NEWSLETTER", "found": false}, {"type": "without", "string": "Blick ins Heft", "found": false}, {"type": "without", "string": "Mediadaten", "found": false}]}
{"file": "rete-mirabile.net.15jahre.html", "url": "https://rete-mirabile.net/notizen/15-jahre-rete-mirabile/", "text_len": 2956, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Im Trubel des Alltags", "found": true}, {"type": "with", "string": "Vor zehn Jahren war Twitter", "found": true}, {"type": "with", "string": "Aktuell fallen mir wieder mehr Themen ein", "found": true}, {"type": "without", "string": "Deine E-Mail-Adresse wird nicht ver\u00f6ffentlicht", "found": false}, {"type": "without", "string": "Logo von Jonathas Mello", "found": false}, {"type": "without", "string": "Gedanken \u00fcber Lernen und Schule", "found": false}]}
{"file": "tomshardware.com.rtx.html", "url": "https://www.tomshardware.com/uk/news/where-and-how-to-buy-rtx-3080-3090-3070", "text_len": 9101, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "RTX 3000 series graphics cards are finally", "found": true}, {"type": "with", "string": "also some aftermarket RTX 3080 cards up on", "found": true}, {"type": "with", "string": "RTX 3080 and RTX 3090 cards are", "found": true}, {"type": "without", "string": "No spam, we promise.", "found": false}, {"type": "without", "string": "More about...", "found": false}, {"type": "without", "string": "When you purchase through links on our site", "found": false}]}
{"file": "jagdleben.de-waldwege.html", "url": "https://www.jagderleben.de/news/waldwege-unrechtsmaessig-gesperrt-polizei-ermittelt-wegen-noetigung-713266", "text_len": 698, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Landwirte und Eigent\u00fcmer werden so", "found": true}, {"type": "with", "string": "Hinweise unter der", "found": true}, {"type": "without", "string": "Wer die \u00c4ste immer wieder auf", "found": false}, {"type": "without", "string": "Kommentieren Sie", "found": false}, {"type": "without", "string": "angegriffen: Polizei", "found": false}]}
{"file": "clarin.com-albertofernandez.html", "url": "https://www.clarin.com/politica/tension-alberto-fernandez-cristina-kirchner-escalo-maximo-nivel_0_h7svjXlK9z.html", "text_len": 7253, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "embestida que sum\u00f3 por estas horas", "found": true}, {"type": "with", "string": "La C\u00e1mpora en declaraciones radiales", "found": true}, {"type": "with", "string": "cuenta administrada por su", "found": true}, {"type": "without", "string": "Mir\u00e1 tambi\u00e9n", "found": false}, {"type": "without", "string": "Cristina Kirchner y Alberto Fern\u00e1ndez,", "found": true}, {"type": "without", "string": "Lo que ten\u00e9s que saber hoy", "found": false}]}
{"file": "dubisthalle.de-Intendanten-Wechsel.html", "url": "https://dubisthalle.de/intendanten-wechsel-beim-mdr", "text_len": 1822, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Von ihren 32 Jahren im MDR", "found": true}, {"type": "with", "string": "war Karola Wille 27 Jahre in leitenden Funktionen t\u00e4tig", "found": true}, {"type": "with", "string": "Im November 1991 begann sie als Referentin", "found": true}, {"type": "without", "string": "MELDUNGEN AUS DER POLITIK", "found": false}, {"type": "without", "string": "AKTUELLE POLIZEI-MELDUNGEN", "found": false}, {"type": "without", "string": "NEUESTE KOMMENTARE", "found": false}]}
{"file": "kxan.com-Voters.html", "url": "https://www.kxan.com/news/texas/voters-pass-increase-for-retired-public-education-workers-but-future-shortfalls-likely-to-emerge/", "text_len": 2403, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "So many of our retirees", "found": true}, {"type": "with", "string": "been living in this high-inflation environment", "found": true}, {"type": "with", "string": "are living on credit cards", "found": true}, {"type": "without", "string": "AUSTIN WEATHER", "found": false}, {"type": "without", "string": "TRENDING STORIES", "found": false}, {"type": "without", "string": "APD addresses Kaitlin Armstrong\u2019s online searches", "found": false}]}
{"file": "skateboardmsm.de.dormhagen.html", "url": "https://skateboardmsm.de/news/the-captains-quest-2017-contest-auf-schwimmender-miniramp-am-19-august-in-dormagen.html", "text_len": 1082, "tp": 3, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wakebeach 257", "found": true}, {"type": "with", "string": "Be there or be square!", "found": true}, {"type": "with", "string": "Hier geht\u2019s zur Facebook Veranstaltung", "found": true}, {"type": "with", "string": "Blue Tomato pr\u00e4sentiert die dritte", "found": false}, {"type": "without", "string": "More from News", "found": false}, {"type": "without", "string": "von Redaktion MSM", "found": false}, {"type": "without", "string": "add yours.", "found": false}]}
{"file": "viertausendhertz.de.ddg48.html", "url": "https://viertausendhertz.de/ddg48/", "text_len": 761, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Im Dialekt zu singen", "found": true}, {"type": "with", "string": "Mit seinen Songs \u00fcber Gl\u00fccksspiel", "found": true}, {"type": "with", "string": "Stammcaf\u00e9, Gulaschsuppe essen", "found": true}, {"type": "without", "string": "Foto: Ingo Pertramer", "found": false}, {"type": "without", "string": "Mehr Episoden anzeigen", "found": false}, {"type": "without", "string": "Mit dem Cartoonisten Tobias Vogel in Krefeld", "found": false}]}
{"file": "d73e0fa055834b2dbb2036ba27d46597.html", "url": "https://www.grazia-magazin.de/beauty/lange-haare-dank-dieser-lebensmittel-wachsen-sie-viel-schneller-43980.html", "text_len": 2964, "tp": 3, "fn": 0, "fp": 1, "tn": 3, "details": [{"type": "with", "string": "Haare beschleunigen k\u00f6nnt?", "found": true}, {"type": "with", "string": "sowie Kalzium, Eisen, Zink und Biotin enthalten", "found": true}, {"type": "with", "string": "F\u00fcr Rapunzelhaare sorgt \u00fcbrigens auch", "found": true}, {"type": "without", "string": "Weitere Themen", "found": false}, {"type": "without", "string": "Richtig fr\u00fchst\u00fccken", "found": true}, {"type": "without", "string": "Hinweis ausblenden", "found": false}, {"type": "without", "string": "Klambt Style-Verlag GmbH & Co. KG", "found": false}]}
{"file": "lidl.de-nachhaltigkeit.html", "url": "https://www.lidl.de/c/nachhaltigkeit-im-onlineshop/s10009344", "text_len": 3873, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Wegfall des Lieferscheins und der", "found": true}, {"type": "with", "string": "geben wir an unsere Kartonagelieferanten weiter.", "found": true}, {"type": "with", "string": "unserer Kundschaft zuk\u00fcnftig die", "found": true}, {"type": "without", "string": "ZUR NACHHALTIGKEIT IM ONLINESHOP", "found": false}, {"type": "without", "string": "SCHRITT F\u00dcR SCHRITT ANLEITUNG", "found": false}, {"type": "without", "string": "Ich habe als Gast bestellt", "found": true}]}
{"file": "elpais.com.uy-gobierno.html", "url": "https://www.elpais.com.uy/informacion/sociedad/gobierno-acusa-montecon-aliarse-sindicato-fomentar-conflicto-portuario.html", "text_len": 8060, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "ahora enviar\u00eda a 125 trabajadores", "found": true}, {"type": "with", "string": "previstos para fin de mes. Horas m\u00e1s tarde", "found": true}, {"type": "with", "string": "caus\u00f3 a la firma que dirige la p\u00e9rdida de dos", "found": true}, {"type": "without", "string": "Por \u00faltimo, se ofreci\u00f3 que la ANP tome en cuenta", "found": true}, {"type": "without", "string": "LAS M\u00c1S VISTAS", "found": false}, {"type": "without", "string": "Puerto de Montevideo. Foto: Archivo", "found": false}]}
{"file": "luxuriousmagazine.com.polo.html", "url": "https://www.luxuriousmagazine.com/2019/06/royal-salute-polo-rome/", "text_len": 3035, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Argentina, the birthplace of polo.", "found": true}, {"type": "with", "string": "Simon Wittenberg travels to the Eternal City in Italy", "found": true}, {"type": "without", "string": "Luxury and lifestyle articles", "found": false}, {"type": "without", "string": "Pinterest", "found": false}]}
{"file": "d57cfadc540842ebb09971e28df123ec.html", "url": "https://www.express.de/duesseldorf/duesseldorf-tote-tauben-im-iss-dome-gefunden----peta--erstattet-strafanzeige-33335766", "text_len": 2961, "tp": 3, "fn": 0, "fp": 1, "tn": 3, "details": [{"type": "with", "string": "Viele verenden qualvoll in den Netzen", "found": true}, {"type": "with", "string": "Das soll das Problem l\u00f6sen", "found": true}, {"type": "with", "string": "em st\u00e4dtischen Veterin\u00e4ramt umgesetzt.", "found": true}, {"type": "without", "string": "zwischen t\u00fcrkischer und kurdischer Mannschaft", "found": true}, {"type": "without", "string": "URL zum Kopieren", "found": false}, {"type": "without", "string": "Inhalt teilen", "found": false}, {"type": "without", "string": "Sei der/die Erste deiner Freunde", "found": false}]}
{"file": "tine.no.fotballskole.html", "url": "https://www.tine.no/presserom/nyhetsarkiv/nff-tine-fotballskole-viktig-for-barneidretten-gjennom-pandemien", "text_len": 3023, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "En annerledes sesong med TINE Fotballskole n\u00e6rmer seg", "found": false}, {"type": "with", "string": "TINE Fotballskole er en fantastisk og veldig", "found": true}, {"type": "with", "string": "TINE v\u00e6re med \u00e5 bidra, avslutter Syversen.", "found": true}, {"type": "without", "string": "113 Kalbakken, 0902 Oslo", "found": false}, {"type": "without", "string": "dine og tar i mot kommentarer og forslag.", "found": false}, {"type": "without", "string": "7. oktober 2020", "found": false}]}
{"file": "bundesfeuerwehrverband.at-er\u00f6ffnet.html", "url": "https://www.bundesfeuerwehrverband.at/2021/10/20/zentrum-am-berg-offiziell-eroeffnet/", "text_len": 3996, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Mit mehr als vier", "found": true}, {"type": "with", "string": "Heinz Fa\u00dfmann ging auf die", "found": true}, {"type": "with", "string": "W\u00fcrdigung der \u00d6BFV-Kooperation", "found": true}, {"type": "without", "string": "Landesverb\u00e4nde", "found": false}, {"type": "without", "string": "Aktuelles aus dem \u00d6BFV", "found": false}, {"type": "without", "string": "E-LBD Krugfahrt verstorben", "found": false}]}
{"file": "journelles.de.westwing.html", "url": "https://www.journelles.de/gift-guide-westwing-22/", "text_len": 1783, "tp": 2, "fn": 1, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Geschenke f\u00fcr die Liebsten aussuchen,", "found": true}, {"type": "with", "string": "Buchst\u00fctzen:", "found": true}, {"type": "with", "string": "All diese sch\u00f6nen Produkte und", "found": false}, {"type": "without", "string": "Tags:", "found": false}, {"type": "without", "string": "Anzeige, enth\u00e4lt Affiliate Links", "found": true}, {"type": "without", "string": "Das ist Liebe in deinem Posteingang:", "found": false}]}
{"file": "gay.ch-papst.html", "url": "https://gay.ch/news/vatikan-eltern-sollen-queere-kinder-unterstuetzen-sagt-der-papst", "text_len": 1988, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Obwohl sich gerade viele Gl\u00e4ubige", "found": true}, {"type": "with", "string": "sorgte Papst Franzikus nun", "found": true}, {"type": "with", "string": "Der Zickzack-Kurs der Katholischen", "found": false}, {"type": "without", "string": "Weitere Artikel zum Thema:", "found": false}, {"type": "without", "string": "VATIKAN: Papst fordert", "found": false}, {"type": "without", "string": "SCHWEIZ/ DEUTSCHLAND:", "found": false}]}
{"file": "theinsidersnet.com-wellaflex.html", "url": "https://www.theinsidersnet.com/de-de/campaigns/info/55887/welladryhairspraysmf2202.htm", "text_len": 2064, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Dann haben wir genau das richtige f\u00fcr Dich!", "found": true}, {"type": "with", "string": "Du m\u00f6chtet Deinen Look nach", "found": true}, {"type": "with", "string": "Dose kr\u00e4ftig sch\u00fctteln. Spr\u00fchkopf", "found": true}, {"type": "without", "string": "Start", "found": false}, {"type": "without", "string": "das Influencer-Marketingnetzwerk", "found": false}, {"type": "without", "string": "eine Kampagne mit uns", "found": false}]}
{"file": "rosa-mag.de.womanking.html", "url": "https://rosa-mag.de/sheila-atim-the-woman-king-zeigt-weibliche-staerke-in-all-ihren-facetten/", "text_len": 8424, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Gerade ist der Hollywood Blockbuster", "found": true}, {"type": "with", "string": "Atim: The Woman King zeigt weibliche St\u00e4rke", "found": true}, {"type": "with", "string": "Die Stunt-Szenen im Film sind", "found": true}, {"type": "without", "string": "Unterst\u00fctze RosaMag ", "found": true}, {"type": "without", "string": "W\u00e4hle deine Mitgliedschaft", "found": false}, {"type": "without", "string": "RELATED POSTS", "found": false}]}
{"file": "unsere-zeitung.at.inklusion.html", "url": "https://www.unsere-zeitung.at/2020/02/02/ist-die-inklusion-im-kapitalismus-umsetzbar/", "text_len": 5062, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Soziales Netzwerk, Sozialraumorientierung, Inklusion", "found": true}, {"type": "with", "string": "Hohe Bedeutung von sozialen", "found": true}, {"type": "with", "string": "Menschen mit Behinderung, ist im Bereich", "found": true}, {"type": "without", "string": "Abonniere unseren Newsletter", "found": false}, {"type": "without", "string": "Alle Kooperationspartner von Unsere Zeitung auf einem Blick", "found": false}, {"type": "without", "string": "Verein \u201eUnsere Zeitung \u2013 Die Demokratische.\u201c", "found": false}]}
{"file": "madame.lefigaro.fr.dintestin.html", "url": "https://madame.lefigaro.fr/bien-etre/problemes-dintestin-quoi-manger-pour-aller-bien-110417-130897", "text_len": 6165, "tp": 3, "fn": 0, "fp": 1, "tn": 3, "details": [{"type": "with", "string": "Car oui, avec ses 200 millions de neurones", "found": true}, {"type": "with", "string": "Travailler son stress", "found": true}, {"type": "with", "string": "riches en pr\u00e9biotiques et en probiotiques.", "found": true}, {"type": "without", "string": "\u00c0 lire aussi", "found": true}, {"type": "without", "string": "d\u00eene tard chez soi", "found": false}, {"type": "without", "string": "Remportez le soin Time-Filler", "found": false}, {"type": "without", "string": "veuillez vous connecter", "found": false}]}
{"file": "abookshelffullofsunshine.blogspot.com.interview.html", "url": "https://abookshelffullofsunshine.blogspot.com/2013/10/news-viertes-eigenes-blog-interview.html", "text_len": 4373, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Vor einiger Zeit durfte ich \"Endless Life\"", "found": true}, {"type": "with", "string": "Am 4. Oktober kommt dein", "found": true}, {"type": "with", "string": "Freiraum f\u00fcr seine eigenen Gedanken", "found": true}, {"type": "without", "string": "Angelfall \u2013 Tage der Dunkelheit", "found": false}, {"type": "without", "string": "Kommentare:", "found": false}, {"type": "without", "string": "Ihr seid die Besten!", "found": false}]}
{"file": "deutschlandfunk.de.titanic.html", "url": "https://www.deutschlandfunk.de/die-zukunft-der-arbeit-wir-dekorieren-auf-der-titanic-die.911.de.html?dram:article_id=385022", "text_len": 32261, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Digitalisierung der Arbeitswelt werde Millionen Arbeitspl\u00e4tze kosten, auch in Deutschland.", "found": true}, {"type": "with", "string": "Das Problem ist dabei nicht das selbstfahrende", "found": true}, {"type": "with", "string": "Also ich glaube, wenn man sich", "found": true}, {"type": "without", "string": "Entdecken Sie den Deutschlandfunk", "found": false}, {"type": "without", "string": "Deutschlandradio \u00a9 2009-2020", "found": false}, {"type": "without", "string": "Mehr zum Thema", "found": false}]}
{"file": "plentylife.blogspot.pamela-reif.html", "url": "https://plentylife.blogspot.com/2017/05/strong-beautiful-pamela-reif-rezension.html", "text_len": 3739, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Sch\u00f6nheit kommt f\u00fcr Pamela von Innen und Au\u00dfen", "found": true}, {"type": "with", "string": "Die Workout \u00dcbungen kannte ich bereits", "found": true}, {"type": "without", "string": "Links zu diesem Post", "found": false}, {"type": "without", "string": "mehr \u00fcber mich", "found": false}, {"type": "without", "string": "Bitte beachte auch die Datenschutzerkl\u00e4rung von Google.", "found": false}]}
{"file": "stackoverflow.com.rust.html", "url": "https://stackoverflow.blog/2020/01/20/what-is-rust-and-why-is-it-so-popular/", "text_len": 11303, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Rust has been", "found": true}, {"type": "with", "string": "Going beyond technical points", "found": true}, {"type": "without", "string": "Jake is the co-founder", "found": false}, {"type": "without", "string": "What inspires someone", "found": false}, {"type": "without", "string": "Discover and share internal knowledge", "found": false}]}
{"file": "archive.ordnungsrausch.com.orga-life.html", "url": "https://web.archive.org/web/20160526181643/http://ordnungsrausch.com/orga-life-das-leben-organisieren/", "text_len": 331, "tp": 1, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wenn der Tag mal wieder zu wenige Stunden hat", "found": true}, {"type": "without", "string": "#19 Kuchen im Glas", "found": false}, {"type": "without", "string": "2016 Ordnungsrausch", "found": false}, {"type": "without", "string": "Suche", "found": false}]}
{"file": "fr.de.nordkorea.html", "url": "https://www.fr.de/politik/kim-jong-un-nordkorea-bilder-diktator-donald-trump-zr-13680734.html", "text_len": 8635, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Er sendet Gr\u00fc\u00dfe nach Nordkorea.", "found": true}, {"type": "with", "string": "wenn auch nur in der demilitarisierten Zone im Grenzgebiet und nur f\u00fcr ein paar Schritte.", "found": true}, {"type": "with", "string": "runggelenk operierte worden und deshalb wochenlang verschwunden gewesen sei", "found": true}, {"type": "without", "string": "Das k\u00f6nnte Sie auch interessieren", "found": false}, {"type": "without", "string": "Abo-Service", "found": false}, {"type": "without", "string": "Mehr zum Thema", "found": false}]}
{"file": "uniqz.de.katzendecke.html", "url": "https://uniqz.de/produkte/katzendecke-zweilagig-mit-namen-und-main-coon/", "text_len": 593, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Lieferzeit: 15 - 21 Tag(e)", "found": false}, {"type": "with", "string": "Hochwertige Hunde- oder Katzendecke in besonders kuscheliger", "found": false}, {"type": "with", "string": "Main Coon-Stickerei", "found": false}, {"type": "without", "string": "Das Kleingedruckte", "found": false}, {"type": "without", "string": "Informationen", "found": false}, {"type": "without", "string": "Copyright / Rechte", "found": false}]}
{"file": "for-me-online.de-pubert\u00e4t.html", "url": "https://www.for-me-online.de/familie/kinder/tochter-pubertaet", "text_len": 3747, "tp": 2, "fn": 1, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Dann ist sie wohl in der Pubert\u00e4t!", "found": false}, {"type": "with", "string": "bei Problemen auch an andere", "found": true}, {"type": "with", "string": "Du wirst manchmal sehr", "found": true}, {"type": "without", "string": "Mehr Inspiration", "found": false}, {"type": "without", "string": "Jetzt registrieren", "found": false}, {"type": "without", "string": "erhalten Sie exklusive", "found": true}]}
{"file": "ledevoir.com.trottinettes.html", "url": "https://www.ledevoir.com/politique/montreal/573258/la-fin-des-trottinettes-en-libre-service-a-montreal", "text_len": 2021, "tp": 1, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "En raison du taux \u00e9lev\u00e9 de d\u00e9linquance", "found": true}, {"type": "with", "string": "D\u2019autres d\u00e9tails suivront.", "found": false}, {"type": "without", "string": "La GRC doit partir", "found": false}, {"type": "without", "string": "des 4 articles gratuits", "found": false}, {"type": "without", "string": "Du lundi au samedi", "found": false}]}
{"file": "d70fab3adde74d5fb63552855c981395.html", "url": "https://www.stern.de/politik/ausland/niederlage-fuer-johnson--parlament-vertagt-votum-ueber-brexit-deal-8961728.html?utm_campaign=alle&utm_medium=rss-feed&utm_source=standard", "text_len": 2928, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Der Premierminister muss eine Verl\u00e4ngerung", "found": true}, {"type": "with", "string": "empfindliche Niederlage zugef\u00fcgt.", "found": true}, {"type": "with", "string": "mit knapper Mehrheit in einem Referendum f\u00fcr den Austritt", "found": true}, {"type": "without", "string": "Themen in diesem Artikel", "found": false}, {"type": "without", "string": "Video", "found": false}, {"type": "without", "string": "Drucken", "found": false}]}
{"file": "autohaus.de-skode.html", "url": "https://www.autohaus.de/nachrichten/autohersteller/skoda-der-lange-weg-zum-strom-2980654", "text_len": 4749, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "immerhin auf Platz drei", "found": true}, {"type": "with", "string": "Fuhrparks greifen zu", "found": true}, {"type": "with", "string": "Das neue Top-Modell", "found": false}, {"type": "without", "string": "Skoda: Der lange Weg zum Strom", "found": false}, {"type": "without", "string": "Familien-L\u00f6sung", "found": false}, {"type": "without", "string": "Fahrbericht BMW", "found": false}]}
{"file": "heiko-adams.de.laufen.html", "url": "http://www.heiko-adams.de/laufen-im-winter-von-baeh-zu-yeah-in-12-monaten/", "text_len": 920, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Heute, 12 Monate sp\u00e4ter,", "found": true}, {"type": "with", "string": "das gef\u00e4llt mir \ud83d\ude09", "found": true}, {"type": "without", "string": "Einfach laufen lassen", "found": false}, {"type": "without", "string": "Heiko's Activity", "found": false}]}
{"file": "doschu.com.solopreneur.html", "url": "https://www.doschu.com/2020/02/solopreneur-social-media-linkedin/", "text_len": 8627, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Einblicke und Impulse aus der Praxis", "found": true}, {"type": "with", "string": "Was ist zu beachten um sich im Business", "found": true}, {"type": "with", "string": "Ohne diesen Blog, welcher", "found": true}, {"type": "without", "string": "Like it? Share it!", "found": false}, {"type": "without", "string": "Hinterlassen Sie einen Kommentar", "found": false}, {"type": "without", "string": "Let\u2019s Talk @ Social Web", "found": false}]}
{"file": "mueritzurlauber.de.blockhaus.html", "url": "http://www.mueritzurlauber.de/blockhaus-typ-3/", "text_len": 3548, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Das helle und liebevoll eingerichtete Blockhaus 1 hat", "found": true}, {"type": "with", "string": "Buchung ab 3 N\u00e4chte oder nach Absprache.", "found": true}, {"type": "with", "string": "\u00fcber die freien Termine oder nehmen einfach Kontakt zu uns auf.", "found": true}, {"type": "without", "string": "info@mueritzurlauber.de", "found": false}, {"type": "without", "string": "039931 51438", "found": false}, {"type": "without", "string": "Datenschutzerkl\u00e4rung", "found": false}]}
{"file": "eawag.ch-elektron.html", "url": "https://www.eawag.ch/de/news-agenda/news-plattform/news/auf-das-erste-elektron-kommt-es-an/", "text_len": 4657, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Reduktionsraten schwanken stark", "found": true}, {"type": "with", "string": "Meret Aeppli, die Erstautorin der Studie", "found": true}, {"type": "with", "string": "Die Studie beschreibt nur einen kleinen", "found": true}, {"type": "without", "string": "Kontakt an ETHZ", "found": false}, {"type": "without", "string": "Rund um Wurzeln, die Sauerstoff in den Boden bringen, lagert sich", "found": false}, {"type": "without", "string": "Originalpublikation", "found": true}]}
{"file": "spiegel.de.albtraum.html", "url": "https://www.spiegel.de/spiegel/print/d-161500790.html", "text_len": 15558, "tp": 3, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "Wie konnte es dazu kommen?", "found": true}, {"type": "with", "string": "Die Geschichte beginnt am 26. Oktober", "found": true}, {"type": "with", "string": "Es st\u00fctzt seine Version.", "found": true}, {"type": "without", "string": "und Vorteile sichern!", "found": false}, {"type": "without", "string": "Verschickt", "found": false}, {"type": "without", "string": "Die digitale Welt der Nachrichten.", "found": false}, {"type": "without", "string": "Vervielf\u00e4ltigung nur mit Genehmigung", "found": false}]}
{"file": "derpapierplanet.de.juni.html", "url": "https://www.derpapierplanet.de/2015/06/through-booking-glass-juni-genre.html", "text_len": 9094, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Jeder darf mit machen", "found": true}, {"type": "with", "string": "als wirklich ausgiebig Fantasy", "found": true}, {"type": "with", "string": "einem schon gewisse Bilder", "found": true}, {"type": "without", "string": "Du m\u00f6chtest gerne bei Through", "found": true}, {"type": "without", "string": "dir abgeschickten Kommentar akzeptierst", "found": true}, {"type": "without", "string": "Teilnehmende Blogs:", "found": false}]}
{"file": "1000things.at-Wellnessoasen.html", "url": "https://www.1000things.at/blog/wellnessoasen-thermen-vulkanland/", "text_len": 8206, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Wusstest ihr, dass die stressabbauende Wirkung von Thermalwasser", "found": true}, {"type": "with", "string": "im Thermen- & Vulkanland wissenschaftlich belegt ist?", "found": true}, {"type": "with", "string": "Kein Wunder also, dass schon ein paar Tage Urlaub im Winter hier die reinste Energieladung sind.", "found": true}, {"type": "without", "string": "Ein Roadtrip entlang der Route 66 im Thermen- & Vulkanland", "found": true}, {"type": "without", "string": "Herbstlicher Wochenend-Ausflug in die S\u00fcdoststeiermark", "found": true}, {"type": "without", "string": "Mehr von 1000things", "found": false}]}
{"file": "Dezubekizacja - reaktywacja. Czyli daty maj\u0105 znaczenie - Dziennik.pl.html", "url": "https://wiadomosci.dziennik.pl/polityka/artykuly/8156148,dezubekizacja-trybunal-konstytucyjny-wyrok-termin.html", "text_len": 1327, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Historia dezubekizacji przed", "found": false}, {"type": "with", "string": "12 maja. Tego", "found": true}, {"type": "with", "string": "Skar\u017c\u0105cy powo\u0142ali si\u0119", "found": true}, {"type": "without", "string": "Trybuna\u0142 Konstytucyjny", "found": false}, {"type": "without", "string": "CZYTAJ WI\u0118CEJ W", "found": false}, {"type": "without", "string": "Materia\u0142 chroniony prawem", "found": false}]}
{"file": "iass-potsdam.de.energiewende.html", "url": "https://www.iass-potsdam.de/de/forschungsbereich/energiewende-und-gesellschaftlicher-wandel ", "text_len": 3306, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Dekarbonisierung der Energieversorgung", "found": true}, {"type": "with", "string": "Vision", "found": true}, {"type": "with", "string": "Mission", "found": true}, {"type": "without", "string": "FORSCHUNGSGRUPPEN", "found": false}, {"type": "without", "string": "Weitere Beitr\u00e4ge anzeigen", "found": false}, {"type": "without", "string": "NEWSLETTER", "found": false}]}
{"file": "elcomercio.pe-kenjifujimori.html", "url": "https://elcomercio.pe/politica/justicia/kenji-fujimori-juicio-contra-excongresista-por-presunta-compra-de-votos-continuara-el-18-de-mayo-pedro-pablo-kuczynski-ppk-fiscalia-rmmn-noticia/", "text_len": 2042, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "de oficio (Milton Hinojoza y Luis Loyola)", "found": true}, {"type": "with", "string": "demostrar\u00edan que los acusados habr\u00edan", "found": true}, {"type": "with", "string": "PPK y Kenji Fujimori por", "found": true}, {"type": "without", "string": "VIDEO RECOMENDADO", "found": false}, {"type": "without", "string": "Fiscal\u00eda de la Naci\u00f3n abre investigaci\u00f3n", "found": false}, {"type": "without", "string": "Este juicio comprende tambi\u00e9n a", "found": true}]}
{"file": "kaieteurnewsonline.com-essequibo.html", "url": "https://www.kaieteurnewsonline.com/2022/05/06/essequibo-hunter-found-dead-with-gunshot-wounds/", "text_len": 4654, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "they had heard when", "found": true}, {"type": "with", "string": "Ramdehol had told them to", "found": true}, {"type": "with", "string": "was removed and taken to Suddie", "found": true}, {"type": "without", "string": "Guyanese killed", "found": false}, {"type": "without", "string": "Coalition Govt \u2018short-changed\u2019 judiciary in 2018", "found": false}, {"type": "without", "string": "Club 40overs cricket...", "found": false}]}
{"file": "meedia.de.freenet.html", "url": "https://meedia.de/2016/03/08/einstieg-ins-tv-geschaeft-wie-freenet-privatkunden-fuer-antennen-tv-in-hd-qualitaet-gewinnen-will/", "text_len": 7373, "tp": 2, "fn": 1, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "Dadurch sollen Privatkunden", "found": false}, {"type": "with", "string": "Welche Werbeeinnahmen erwarten Sie hier langfristig?", "found": true}, {"type": "with", "string": "wir haben keinerlei Pl\u00e4ne, das zu ver\u00e4ndern.", "found": true}, {"type": "without", "string": "Nachrichten\u00fcberblick abonnieren", "found": false}, {"type": "without", "string": "\u00fcber alle aktuellen Entwicklungen auf dem Laufenden.", "found": false}, {"type": "without", "string": "Schlagworte", "found": false}, {"type": "without", "string": "Dauerzoff um drohenden UKW-Blackout", "found": false}]}
{"file": "lemire.me.json.html", "url": "https://lemire.me/blog/2019/08/02/json-parsing-simdjson-vs-json-for-modern-c/", "text_len": 1329, "tp": 3, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "I use a Skylake processor with GNU GCC 8.3.", "found": true}, {"type": "with", "string": "gsoc-2018", "found": true}, {"type": "with", "string": "0.091 GB/s", "found": true}, {"type": "with", "string": "version 0.2 on vcpkg.", "found": false}, {"type": "without", "string": "Leave a Reply", "found": false}, {"type": "without", "string": "Science and Technology links", "found": false}, {"type": "without", "string": "Proudly powered by WordPress", "found": false}]}
{"file": "laviedesidees.fr.evaluation.html", "url": "https://laviedesidees.fr/L-evaluation-et-les-listes-de.html", "text_len": 36333, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Depuis longtemps,", "found": true}, {"type": "with", "string": "Retour sur les revues de rang", "found": true}, {"type": "with", "string": "Quelques r\u00e9flexions", "found": true}, {"type": "without", "string": "enqu\u00eates \u00e0 propos des pratiques de publication", "found": false}, {"type": "without", "string": "Si vous souhaitez critiquer ou d\u00e9velopper cet article", "found": false}, {"type": "without", "string": "T\u00e9l\u00e9charger au format EPUB", "found": false}]}
{"file": "tour-magazin.de-unfall.html", "url": "https://www.tour-magazin.de/profisport/news/nach-unfall-auf-intensivstation-bernal-kaempft-um-karriere/a51346.html", "text_len": 2817, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Sieger der Tour de France", "found": true}, {"type": "with", "string": "Twitter und reihte sich damit", "found": true}, {"type": "with", "string": "Der Unfall erinnert an den schweren", "found": true}, {"type": "without", "string": "Das k\u00f6nnte Sie auch interessieren", "found": false}, {"type": "without", "string": "Branchen News", "found": false}, {"type": "without", "string": "Egan Bernal verl\u00e4ngert bis", "found": false}]}
{"file": "reisen-mit-dem-internet.de.emden-21416.html", "url": "https://www.reisen-mit-dem-internet.de/europa/deutschland/niedersachsen/ostfriesland/emden-21416", "text_len": 7625, "tp": 2, "fn": 1, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Emden ist vor allem in Deutschland", "found": true}, {"type": "with", "string": "Die Kunsthalle in Emden wurde 1986", "found": true}, {"type": "with", "string": "Erwachsene: 3 \u20ac (Preis 2019) ", "found": false}, {"type": "without", "string": "Quellen und Inspiration: u.a. wikipedia.org", "found": false}, {"type": "without", "string": "Infos zum Reiseziel", "found": false}]}
{"file": "Maciej Krzysztoszek rzecznik prasowy Amica mened\u017cer komunikacji zewn\u0119trznej.html", "url": "https://www.wirtualnemedia.pl/artykul/maciej-krzysztoszek-rzecznik-prasowy-amica-menedzer-komunikacji-zewnetrznej", "text_len": 1464, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "w dziale marketingu.", "found": true}, {"type": "with", "string": "Mickiewicza w Poznaniu.", "found": true}, {"type": "with", "string": "i komunikacj\u0105 wewn\u0119trzn\u0105.", "found": true}, {"type": "without", "string": "Zmiany personalne", "found": false}, {"type": "without", "string": "polecamy", "found": false}, {"type": "without", "string": "Podziel si\u0119", "found": false}]}
{"file": "mpimet.de.klimasystem.html", "url": "https://mpimet.mpg.de/kommunikation/aktuelles/single-news/neuer-blick-auf-das-blue-marble-foto-icon-simuliert-das-gekoppelte-klimasystem-mit-1-km-aufloesung.", "text_len": 8452, "tp": 2, "fn": 1, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Die fr\u00fchen 1970er Jahre werden oft", "found": false}, {"type": "with", "string": "W\u00e4hrend wir \u00fcber die Urspr\u00fcnge", "found": true}, {"type": "with", "string": "Die Daten werden mithilfe von NVIDIA", "found": true}, {"type": "without", "string": "Weitere Informationen:", "found": true}, {"type": "without", "string": "Kontakt:", "found": true}, {"type": "without", "string": "MPI Website /Kommunikation /Aktuelles /Single News", "found": false}]}
{"file": "brandeins.de.wahresIch.html", "url": "https://www.brandeins.de/magazine/brand-eins-wirtschaftsmagazin/2023/keine-panik/unser-wahres-ich", "text_len": 17686, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "brand eins: \u201eIm Grunde gut\u201c", "found": true}, {"type": "with", "string": "Sie wollen ein popul\u00e4res", "found": true}, {"type": "with", "string": "Ist das Ihr ultimatives", "found": true}, {"type": "without", "string": "Ausgabe kaufen", "found": false}, {"type": "without", "string": "Rechtliches", "found": false}, {"type": "without", "string": "\u00dcber uns", "found": false}]}
{"file": "mixed.de.vrodo.html", "url": "https://mixed.de/vrodo-deals-vr-taugliches-notebook-fuer-83215-euro-99-cent-leihfilme-bei-amazon-psvr/", "text_len": 3946, "tp": 2, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "Niedlicher Roboter-Spielkamerad: Anki Cozmo", "found": true}, {"type": "with", "string": "Empfehlungen von Dennis:", "found": true}, {"type": "without", "string": "Unterst\u00fctze unsere Arbeit", "found": false}, {"type": "without", "string": "Deepfake-Hollywood", "found": false}, {"type": "without", "string": "Avengers", "found": false}, {"type": "without", "string": "Katzenschreck", "found": false}]}
{"file": "fivethirtyeight.com.endorsement.html", "url": "https://fivethirtyeight.com/features/the-2020-endorsement-race-is-getting-interesting/", "text_len": 11647, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "If you\u2019ve been following endorsements", "found": true}, {"type": "with", "string": "fter all, Biden and Sanders lead in national polls", "found": true}, {"type": "with", "string": "Perhaps these endorsements are capturing", "found": true}, {"type": "without", "string": "Perry Bacon Jr. is a senior writer for FiveThirtyEight.", "found": false}, {"type": "without", "string": "Filed under", "found": false}, {"type": "without", "string": "About Nielsen Measurement", "found": false}]}
{"file": "zoo-berlin.de-turm.html", "url": "xhttps://www.zoo-berlin.de/de/aktuelles/alle-news/artikel/der-turm-der-wuensche", "text_len": 2743, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Zuk\u00fcnftig wird man bei der Ein- oder Ausfahrt", "found": false}, {"type": "with", "string": "mehr \u00fcber ihren Lebensraum im ", "found": true}, {"type": "with", "string": " pearlman Erlebnisarchitektur geplant.", "found": true}, {"type": "without", "string": "Zur\u00fcck zur \u00dcbersicht", "found": false}, {"type": "without", "string": "PRESSE-MITTEILUNG", "found": false}, {"type": "without", "string": "Jetzt Newsletter abonnieren", "found": false}]}
{"file": "holzwerken.net-Kreissaege.html", "url": "https://www.holzwerken.net/blog/dominik-ricker/perfekte-schnitte-nach-riss-an-der-kreissaege", "text_len": 2217, "tp": 1, "fn": 2, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Schnitten. Doch es geht auch einfacher...", "found": true}, {"type": "with", "string": "Ein schmales Restst\u00fcck wird am Parallelanschlag", "found": false}, {"type": "with", "string": "Bei d\u00fcnneren Plattenwerkstoffen", "found": false}, {"type": "without", "string": "Das k\u00f6nnte Sie auch interessieren!", "found": false}, {"type": "without", "string": "Nodus-Knoten, Besteckschrank", "found": false}, {"type": "without", "string": "Sie sind aktuell nicht eingeloggt.", "found": true}]}
{"file": "lacrux.com-mammut.html", "url": "https://www.lacrux.com/klettern/mammut-nimmt-adam-ondra-unter-vertrag/", "text_len": 1728, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Im von Adam Ondra ver\u00f6ffentlichten Video", "found": true}, {"type": "with", "string": "Black Diamond bald den R\u00fccken zu und wechselt", "found": true}, {"type": "with", "string": "kurze Sequenzen aneinandergereiht", "found": true}, {"type": "without", "string": "Gef\u00e4llt dir unser Klettermagazin?", "found": true}, {"type": "without", "string": "Das ist die deutsche", "found": false}, {"type": "without", "string": "Wetter Chironico", "found": false}]}
{"file": "bos-fahrzeuge.info-haubenfahrzeuge.html", "url": "https://bos-fahrzeuge.info/news/Die-Haubenfahrzeuge-der-Nachkriegszeit-Teil-49-223", "text_len": 49368, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "seine Fahrzeuge fuhren", "found": true}, {"type": "with", "string": "und Soldatenr\u00e4te das Werk", "found": true}, {"type": "with", "string": "Trittstufe aus \u00fcber", "found": true}, {"type": "without", "string": "St\u00f6rung bei der Suchfunktion", "found": false}, {"type": "without", "string": "Florian Neunkircher...", "found": false}, {"type": "without", "string": "von der Feuerl\u00f6schpolizei", "found": true}]}
{"file": "chefkoch.de.mandarinen.html", "url": "https://www.chefkoch.de/rezepte/607331160490733/Mandarinen-Schmand-Kuchen.html", "text_len": 1086, "tp": 4, "fn": 2, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "der cremigste Kuchen", "found": true}, {"type": "with", "string": "F\u00fcr den M\u00fcrbeteig:", "found": true}, {"type": "with", "string": "Margarine oder Butter", "found": true}, {"type": "with", "string": "Mandarine(n), je ca.", "found": true}, {"type": "with", "string": "Koch-/Backzeit ca.", "found": false}, {"type": "with", "string": "F\u00fcr eine 26er Springform.", "found": false}, {"type": "without", "string": "F\u00fcr dieses Rezept gibt es noch", "found": false}, {"type": "without", "string": "Lactose", "found": false}, {"type": "without", "string": "Tipp falls bei euch", "found": true}]}
{"file": "idw-online.de-Hybridbatterie.html", "url": "https://idw-online.de/de/news823175", "text_len": 3922, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In mikrobiellen Brennstoffzellen verstoffwechseln Bakterien", "found": true}, {"type": "with", "string": "Energietr\u00e4germolek\u00fcle und erzeugen dadurch Strom", "found": true}, {"type": "with", "string": "Wenn die Bakterien energiereiche Molek\u00fcle als Energietr\u00e4ger", "found": true}, {"type": "without", "string": "Die semantisch \u00e4hnlichsten Pressemitteilungen im idw", "found": false}, {"type": "without", "string": "TUB: Kohlendioxid als Rohstoff f\u00fcr die Umwandlung von Solarstrom in wertvolle chemische Produkte", "found": false}, {"type": "without", "string": "\u00bbStrom als Rohstoff\u00ab auf ACHEMA 2018: Gr\u00fcne Energie f\u00fcr eine nachhaltige Chemie", "found": false}]}
{"file": "stuttgart.de.html", "url": "https://www.stuttgart.de/item/show/132240/1", "text_len": 924, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Das Bohnenviertel entstand", "found": true}, {"type": "with", "string": "sich herrlich entspannen.", "found": true}, {"type": "without", "string": "N\u00fctzliche Links", "found": false}, {"type": "without", "string": "Mehr zum Thema", "found": false}]}
{"file": "nurmeinstandpunkt.wordpress.com.blogposting.html", "url": "https://nurmeinstandpunkt.wordpress.com/2020/01/23/blogposting-01-23-2020/", "text_len": 1239, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Pressef\u00f6rderung: Studie zweifelt an St\u00fctze vom Staat", "found": true}, {"type": "with", "string": "via netzpolitik.org", "found": true}, {"type": "with", "string": "via t3n News", "found": true}, {"type": "without", "string": "Hier k\u00f6nnte Ihre Meinung stehen", "found": false}, {"type": "without", "string": "Ein Fehler ist aufgetaucht", "found": false}, {"type": "without", "string": "Es hei\u00dft SOCIAL Media", "found": false}]}
{"file": "haufe.de-ordnungsgeld.html", "url": "https://www.haufe.de/recht/kanzleimanagement/buss-und-ordnungsgeld-gegen-anwalt-wegen-maskenverweigerung_222_560754.html", "text_len": 5452, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "auf Norderney erhielt er wegen", "found": true}, {"type": "with", "string": "Aufforderungen des Vorsitzenden zum Anlegen", "found": true}, {"type": "with", "string": "der Corona-Pandemie allgemein f\u00fcr zul\u00e4ssig", "found": true}, {"type": "without", "string": "Schlagworte zum Thema", "found": false}, {"type": "without", "string": "Produktempfehlung", "found": false}, {"type": "without", "string": "Verweigert der Anwalt die Maske,", "found": true}]}
{"file": "wiki.piratenpartei.de.stammtisch.html", "url": "https://wiki.piratenpartei.de/HE:Kassel/Stammtisch", "text_len": 550, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Der n\u00e4chste Stammtisch", "found": true}, {"type": "with", "string": "Mittwoch des Monats", "found": true}, {"type": "with", "string": "Die Protokolle der Stammtische", "found": true}, {"type": "without", "string": "Diese Seite wurde zuletzt", "found": false}, {"type": "without", "string": "Werkzeuge", "found": false}, {"type": "without", "string": "Benutzerkonto erstellen", "found": false}]}
{"file": "finanztip.de.altersvorsorge.html", "url": "https://www.finanztip.de/betriebliche-altersvorsorge/", "text_len": 37453, "tp": 6, "fn": 0, "fp": 2, "tn": 3, "details": [{"type": "with", "string": "20,2 Mio.", "found": true}, {"type": "with", "string": "Altersvorsorge (bAV) versteht man den Aufbau einer Zusatzrente \u00fcber den Arbeitgeber.", "found": true}, {"type": "with", "string": "vor allem vor der Frage: Lohnt sich das f\u00fcr", "found": true}, {"type": "with", "string": "erl\u00e4utern wir diese genauer.", "found": true}, {"type": "with", "string": "So viel spart ein Durchschnittsverdiener", "found": true}, {"type": "with", "string": "Im Beispiel verliert der Durchschnittsverdiener durch die Entgeltumwandlung", "found": true}, {"type": "without", "string": "Weitere Themen", "found": true}, {"type": "without", "string": "Geld erhalten wir, wenn Sie di", "found": true}, {"type": "without", "string": "Aktuelle Ausgabe des Newsletters", "found": false}, {"type": "without", "string": "Unser Tipp: Bleiben Sie zum Thema", "found": false}, {"type": "without", "string": "05. Februar 2020 ", "found": false}]}
{"file": "auto-wirtschaft.ch-camping.html", "url": "https://auto-wirtschaft.ch/news/8950-fur-die-freiheit-auf-radern-campinglosungen-von-sortimo-am-caravan-salon", "text_len": 1486, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "An f\u00fcnf Messetagen", "found": true}, {"type": "with", "string": "Mit dem EQV stand", "found": true}, {"type": "with", "string": "Thule-Markise sowie", "found": true}, {"type": "without", "string": "Sinus 2021: Kinder und", "found": false}, {"type": "without", "string": "Immer informiert bleiben", "found": false}, {"type": "without", "string": "SHAB-Abfrage", "found": false}]}
{"file": "piratenpatei.de-Entlarvt.html", "url": "https://www.piratenpartei.de/2021/11/12/patrick-breyer-haugen-anhoerung-entlarvt-den-unwillen-der-eu-das-digitale-zeitalter-in-die-eigene-hand-zu-nehmen/", "text_len": 2335, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u201eHaugen warnt, dass Facebooks", "found": true}, {"type": "with", "string": "Die Anh\u00f6rung der Facebook-Whistleblowerin", "found": true}, {"type": "with", "string": "profitgetriebenen Konzernen anzuvertrauen", "found": true}, {"type": "without", "string": "Schreibe einen Kommentar", "found": false}, {"type": "without", "string": "Meinen Namen, meine E-Mail-Adresse", "found": false}, {"type": "without", "string": "Topthemen", "found": false}]}
{"file": "handball.ch-bruderduell.html", "url": "https://www.handball.ch/de/news/2022/cup-vorschau-beim-bsv-stans-freut-man-sich-auf-ein-bruderduell-und-viele-fans/", "text_len": 2529, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Ich glaube fest daran, dass wir die Halle f\u00fcllen", "found": true}, {"type": "with", "string": "spezielle Affiche. Mit Daniel", "found": true}, {"type": "with", "string": "mit Spannung erwarteten Viertelfinals HSC", "found": true}, {"type": "without", "string": "Gemeinsam den Verein", "found": false}, {"type": "without", "string": "DAS K\u00d6NNTE DICH", "found": false}, {"type": "without", "string": "HSC Kreuzlingen in die", "found": false}]}
{"file": "literaturkritik.de-Ann-Cotten.html", "url": "https://literaturkritik.de/franke-cotten-die-anleitungen-der-vorfahren,30063.html", "text_len": 7889, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Es braucht ein wenig Zeit", "found": true}, {"type": "with", "string": "um sich auf diesen Text einzulassen", "found": true}, {"type": "with", "string": "Weder Lyrikband noch ethnologischer Bericht noch Erz\u00e4hlung", "found": true}, {"type": "without", "string": "Ergebnisse einer internationalen Tagung zu einem Forschungsprojekt", "found": false}, {"type": "without", "string": "\u00fcber Heimat, Raum und Emotion in der Literatur seit 1945 bis zur Gegenwart", "found": false}, {"type": "without", "string": "Ich habe die Portraits mit gro\u00dfem Vergn\u00fcgen gelesen", "found": false}]}
{"file": "2gewinnt.wordpress.com.uns.html", "url": "https://2gewinnt.wordpress.com/uber-uns/", "text_len": 2271, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "K\u00fcnstlerischer Lebenslauf", "found": true}, {"type": "with", "string": "Finalist bei der ORF-Show", "found": true}, {"type": "with", "string": "100 Folgen von", "found": true}, {"type": "without", "string": "Sei der Erste dem dies gef\u00e4llt.", "found": false}, {"type": "without", "string": "Gef\u00e4llt mir", "found": false}, {"type": "without", "string": "Gipfelpunkt der Geschmacklosigkeit", "found": false}]}
{"file": "Eurocash rusza z Innowacyjn\u0105 Platform\u0105 Handlu - Handel dystrybucja.html", "url": "https://www.portalspozywczy.pl/handel/wiadomosci/eurocash-rusza-z-innowacyjna-platforma-handlu,198264.html", "text_len": 5189, "tp": 3, "fn": 0, "fp": 3, "tn": 0, "details": [{"type": "with", "string": "Jest to zintegrowany system", "found": true}, {"type": "with", "string": "kasowy IPH POS.", "found": true}, {"type": "with", "string": "dost\u0119p do IPH za 1 z\u0142.", "found": true}, {"type": "without", "string": "Szukasz lokalu handlowego", "found": true}, {"type": "without", "string": "Materia\u0142 chroniony prawem", "found": true}, {"type": "without", "string": "wi\u0119cej informacji:", "found": true}]}
{"file": "haustiermagazin.com-katzenspielzeug.html", "url": "https://www.haustiermagazin.com/kaufratgeber-vergleich-bestes-elektronisches-katzenspielzeug/", "text_len": 13743, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "haben uns deshalb verschiedene elektrische", "found": true}, {"type": "with", "string": "Welches Spiel zu deiner Mieze passt", "found": true}, {"type": "with", "string": "elektrisches Katzenspielzeug bereits", "found": true}, {"type": "without", "string": "TIPPS, HILFE UND SCHN\u00c4PPCHEN", "found": false}, {"type": "without", "string": "Bei den Verlinkungen handelt es sich um", "found": true}, {"type": "without", "string": "drei Kater und aktuell zwei portugiesische", "found": false}]}
{"file": "guten-tach.de-sperrung.html", "url": "https://guten-tach.de/dgb-brueckensperrung-belegt-die-versaeumnisse-der-letzten-jahre/", "text_len": 4212, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "einhergehenden katastrophalen Auswirkungen", "found": true}, {"type": "with", "string": "Ihre gemeinsame Aussage lautet:", "found": true}, {"type": "with", "string": "so die DGB-Vertreter. Auch", "found": true}, {"type": "without", "string": "HINTERLASSEN SIE EINE ANTWORT", "found": false}, {"type": "without", "string": "NOCH MEHR NEWS", "found": false}, {"type": "without", "string": "Ingo Degenhardt (DGB S\u00fcdwestfalen)", "found": false}]}
{"file": "mannschaft.com-katar.html", "url": "https://mannschaft.com/benjamin-naessler-liebe-kennt-keine-pause-gegen-homophobie-in-katar/", "text_len": 3272, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Petition heisst es: \u00abIm Winter 2022", "found": true}, {"type": "with", "string": "US-B\u00fcrger eine sechsmonatige Haftstrafe", "found": true}, {"type": "with", "string": "Organisatoren zu verteidigen und die B\u00fchne", "found": true}, {"type": "without", "string": "VIELLEICHT AUCH", "found": false}, {"type": "without", "string": "Hans und Kosh", "found": false}, {"type": "without", "string": "Coming-outs 2021", "found": false}]}
{"file": "latercera.com-laagenda.html", "url": "https://www.latercera.com/politica/noticia/la-agenda-con-que-interior-busca-contener-la-crisis-de-seguridad-y-el-dilema-del-oficialismo/DHCHJTT5TNETPCHCIYLXWMQOBA/", "text_len": 9752, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "La estrategia contempla, entre otras acciones,", "found": true}, {"type": "with", "string": "efundidos \u201csobre fortalecimiento de la persecuci\u00f3n", "found": true}, {"type": "with", "string": "Y\u00e1\u00f1ez. Y agreg\u00f3: \u201cNosotros permanentemente estamos evaluando a las autoridades", "found": true}, {"type": "without", "string": "M\u00e1s sobre La Tercera AM", "found": true}, {"type": "without", "string": "de terrenos adquiridos por celebridades", "found": false}, {"type": "without", "string": "$636 millones del cambio de mando?", "found": false}]}
{"file": "californiaglobe.com.amazon.html", "url": "https://californiaglobe.com/section-2/amazon-liable-for-defective-third-party-products-rules-ca-appelate-court/", "text_len": 7571, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "The ruling has grouped Amazon with other retailers who", "found": true}, {"type": "with", "string": "provided by Lenoge for its product listing.", "found": true}, {"type": "with", "string": "case to a higher court in the near future.", "found": true}, {"type": "without", "string": "Get a weekly summary of California Globe stories:", "found": false}, {"type": "without", "string": "Follow Us", "found": false}, {"type": "without", "string": "Leave a Reply", "found": false}]}
{"file": "bmas.de-anforderungen.html", "url": "https://www.bmas.de/DE/Service/Presse/Meldungen/2022/aenderung-der-anforderungen-an-impf-und-genesenennachweisen.html", "text_len": 2702, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Das Robert-Koch-Institut (RKI) wurde beauftragt", "found": true}, {"type": "with", "string": "Anforderungen an 3G-Nachweise ggf.", "found": true}, {"type": "with", "string": "wieder den Status \"vollst\u00e4ndig geimpft\"", "found": true}, {"type": "without", "string": "FAQs Betrieblicher Infektionsschutz", "found": true}, {"type": "without", "string": "Fragen zum Thema Betrieblicher Infektionsschutz.", "found": true}, {"type": "without", "string": "NACH OBEN", "found": false}]}
{"file": "energieverbraucher.de.energie.html", "url": "https://www.energieverbraucher.de/de/preise__312/NewsDetail__18725/.", "text_len": 10923, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "(21. November 2022) Energieverbraucher erhalten", "found": true}, {"type": "with", "string": "Zwei weitere Umlagen treffen Verbraucher", "found": true}, {"type": "with", "string": "Auf Grundlage von \u00a7 3 der Allgemeinen Bedingungen", "found": true}, {"type": "without", "string": "weitere Inhalte zu \u00bbPreise\u00ab", "found": false}, {"type": "without", "string": "MITGLIED WERDEN", "found": false}, {"type": "without", "string": "\u00dcBER UNS", "found": false}]}
{"file": "minuto30-lasierra.html", "url": "https://www.minuto30.com/policia-hace-presencia-en-la-sierra/1331134/", "text_len": 1291, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Tras el anuncio del Paro armado por parte", "found": true}, {"type": "with", "string": "El Coronel, asegur\u00f3 que con ayudas", "found": true}, {"type": "with", "string": "del d\u00eda a d\u00eda, no solamente con las patrullas", "found": true}, {"type": "without", "string": "Im\u00e1genes capturadas de video", "found": false}, {"type": "without", "string": "CONTENIDO PATROCINADO", "found": false}, {"type": "without", "string": "se elevan un 583 % en el primer trimestre", "found": false}]}
{"file": "pinup-fashion.de.korsetts.html", "url": "http://pinup-fashion.de/korsetts-shops-designer-online-kaufen/", "text_len": 2894, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Korsetts sind f\u00fcr Pin Up Girls so etwas wie Wasser", "found": true}, {"type": "with", "string": "och was macht den Unterschied beim Korsettkauf", "found": true}, {"type": "with", "string": "Wem Shapewear ab sofort nicht edel", "found": false}, {"type": "without", "string": "Wer einen Rockabilly Shop oder einen", "found": false}, {"type": "without", "string": "Auf Pinup-Fashion findet man tolle Mode", "found": false}, {"type": "without", "string": "Viel Spa\u00df beim St\u00f6bern", "found": false}]}
{"file": "daheim-solar.de.batteriespeicher.html", "url": "https://daheim-solar.de/lexikon/batteriespeicher/", "text_len": 2409, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Der am h\u00e4ufigsten f\u00fcr Solarbatterien", "found": true}, {"type": "with", "string": "Dies ist vor allem im station\u00e4ren Betrieb", "found": true}, {"type": "with", "string": "Lithium-Ionen-Akkumulatoren werden", "found": true}, {"type": "without", "string": "Zur\u00fcck zum Lexikon", "found": false}, {"type": "without", "string": "Zu allen Beitr\u00e4gen", "found": false}, {"type": "without", "string": "Kontakt", "found": false}]}
{"file": "theplanetarypress.com.forestlands.html", "url": "https://www.theplanetarypress.com/2020/01/management-of-intact-forestlands-by-indigenous-peoples-key-to-protecting-climate/", "text_len": 6552, "tp": 2, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "The U.N.-backed principle", "found": true}, {"type": "with", "string": "Overall, these landscapes", "found": true}, {"type": "without", "string": "Management of Intact Forestlands by Indigenous Peoples Key to Protecting Climate", "found": false}, {"type": "without", "string": "China has announced a new plan", "found": false}, {"type": "without", "string": "TPP highlights sustainable solutions", "found": false}]}
{"file": "auto.oe24.at-golfchina.html", "url": "https://auto.oe24.at/thema/vw-chef-diess-warnt-vor-tesla-und-golf-aus-china/497533355", "text_len": 3647, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Stammsitz Wolfsburg zu einem", "found": true}, {"type": "with", "string": "wieder zum Aush\u00e4ngeschild", "found": true}, {"type": "with", "string": "Warnung vor Tesla", "found": true}, {"type": "without", "string": "Auto kostenlos bewerten", "found": false}, {"type": "without", "string": "Mehr Videos", "found": false}, {"type": "without", "string": "des ET7 in Europa an.", "found": false}]}
{"file": "umweltbundesamt.de-atomkraft.html", "url": "https://www.umweltbundesamt.de/themen/eu-taxonomie-atomkraft-erdgas-sind-nicht-nachhaltig", "text_len": 4022, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Entwurf der Europ\u00e4ischen Kommission f\u00fcr einen", "found": false}, {"type": "with", "string": "denn die Entsorgung", "found": true}, {"type": "with", "string": "Energien auszubauen und Technologien", "found": true}, {"type": "without", "string": "Die Auswertung der Stimmen beansprucht einige Zeit.", "found": false}, {"type": "without", "string": "Quelle: jorisvo / Fotolia.com", "found": false}, {"type": "without", "string": "Greenwashing", "found": false}]}
{"file": "nnz-online.de-Quantensprung.html", "url": "https://nnz-online.de/news/news_lang.php?ArtNr=335853", "text_len": 9535, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Gemeinsam mit Kindern der Kindertageseinrichtung", "found": true}, {"type": "with", "string": "des Jugendclubs Mitte sowie Jugendlichen des Kinder- und Jugendstadtrates", "found": true}, {"type": "with", "string": "er\u00f6ffnete Oberb\u00fcrgermeister Kai Buchmann am vergangenen Freitag", "found": true}, {"type": "without", "string": "Am meisten gelesen...", "found": false}, {"type": "without", "string": "Letzte Kommentare", "found": false}, {"type": "without", "string": "Top 10 Artikel der letzten 10 Tage als RSS", "found": false}]}
{"file": "heartlandnewsfeed.com-Christian.html", "url": "https://www.heartlandnewsfeed.com/2023/10/27/christian-county-police-blotters/", "text_len": 3420, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "A vehicle driven by Kimberly Carrell, no age or address reported", "found": true}, {"type": "with", "string": "was southbound on 1600E Road near 400N Road when a deer entered the roadway", "found": true}, {"type": "with", "string": "The vehicle was unable to avoid striking the deer", "found": true}, {"type": "without", "string": "a subsidiary partnership by Heartland Internet Media Networks", "found": false}, {"type": "without", "string": "Heartland Media Group of Central Illinois", "found": false}, {"type": "without", "string": "published by Heartland Newsfeed staff is covered by the BipCot NoGov license", "found": false}]}
{"file": "comparis.ch.autofinanzierung.html", "url": "https://www.comparis.ch/leasing/info/autofinanzierung", "text_len": 5864, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Eine h\u00e4ufig gestellte Frage: Leasing oder Autokredit?", "found": true}, {"type": "with", "string": "Total Differenz (Ersparnis beim Leasing)", "found": true}, {"type": "with", "string": "Welche Art der Autofinanzierung ideal ist", "found": true}, {"type": "without", "string": "Immer aktuell informiert \u00fcber Sparm\u00f6glichkeiten sowie Experten-Tipps", "found": false}, {"type": "without", "string": "8003 Z\u00fcrich", "found": false}, {"type": "without", "string": "Mit der Anmeldung stimme ich der Bearbeitung", "found": false}]}
{"file": "sac-cas.ch-schneesport.html", "url": "https://www.sac-cas.ch/de/umwelt/schneesport-mit-ruecksicht-auf-wildtiere-35334/", "text_len": 1577, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": " du schon einmal durch Tiefschnee gestapft bist", "found": true}, {"type": "with", "string": "Beachte Wildruhezonen und Wildschutzgebiete:", "found": true}, {"type": "with", "string": "sowie die \u00dcbernachtung geh\u00f6ren", "found": true}, {"type": "without", "string": "Verwandte Links", "found": false}, {"type": "without", "string": "Skitour im (Voll)Mondschein", "found": false}, {"type": "without", "string": "Alpentiere im Winter - Tiertafeln", "found": false}]}
{"file": "fischundfang.de-pop-ups.html", "url": "https://fischundfang.de/radical-pop-ups-und-dips/", "text_len": 568, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Kein Wunder \u2013 die Murmeln gibt", "found": true}, {"type": "with", "string": "mit denen die K\u00f6der nochmal", "found": true}, {"type": "with", "string": "Pop-Ups haben sich mittlerweile", "found": true}, {"type": "without", "string": "Radical Dips: \"Bloody Chicken\", \"Smashed Fish", "found": false}, {"type": "without", "string": "Matzes Zander Scheuche", "found": false}, {"type": "without", "string": "mit J\u00f6rg Strehlow", "found": false}]}
{"file": "weinkenner.de-st.magdalener.html", "url": "https://www.weinkenner.de/st-magdalener-rotweine-mit-eleganz-und-charakter/", "text_len": 5090, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Italiens, neben Barolo und Barbaresco", "found": true}, {"type": "with", "string": "St. Magdalener \u00fcberzeugen mit zarter Frucht", "found": true}, {"type": "with", "string": "ernatschwein, der vom Gambero", "found": true}, {"type": "without", "string": "\u00dcber den Autor", "found": false}, {"type": "without", "string": "S\u00fcdtiroler Weissweine die Geschichte schrieben", "found": false}, {"type": "without", "string": "Das ideale Universal-Weinglas", "found": false}]}
{"file": "tierwelt.ch-plez.html", "url": "https://www.tierwelt.ch/news/natur-umwelt/immer-mehr-modemarken-werden-pelzfrei-so-erkennen-sie-echtpelz-im-laden", "text_len": 3897, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Waschb\u00e4ren oder Hunde unter schlechten", "found": true}, {"type": "with", "string": "Fell aus einer Zucht oder gezieltem Wildfang", "found": true}, {"type": "with", "string": "Sind die Haarspitzen sichtbar", "found": true}, {"type": "without", "string": "\u00fcbergeben worden ist.", "found": false}, {"type": "without", "string": "Pelzdeklarationskontrolleure haben im vergangenen", "found": false}, {"type": "without", "string": "Die aktuelle Ausgabe", "found": false}]}
{"file": "boxen.de-staatsanwaltschaft.html", "url": "https://www.boxen.de/news/viviane-obenauf-staatsanwaltschaft-hat-beweise-vorgelegt-70501", "text_len": 1960, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Das wurde abgelehnt, weil die Beweislage", "found": true}, {"type": "with", "string": "Chevrolet Camaro zur Tatzeit vor dem Apartment", "found": true}, {"type": "with", "string": "Tatzeit zuhause gewesen zu sein", "found": true}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}, {"type": "without", "string": "Tyson Fury vs Dillian Whyte wird von", "found": false}, {"type": "without", "string": "Trevor Bryan siegt \u00fcber Jonathan Guidry", "found": false}]}
{"file": "demokratiewebstatt.at.luft.html", "url": "https://www.demokratiewebstatt.at/thema/thema-umwelt-und-klima/woher-kommt-die-dicke-luft", "text_len": 1844, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Eines der gro\u00dfen Probleme,", "found": true}, {"type": "with", "string": "Millionen Menschen fahren jeden Tag", "found": true}, {"type": "with", "string": "versteinerte Dinosaurierknochen.", "found": true}, {"type": "without", "string": "Clipdealer", "found": false}, {"type": "without", "string": "Teste dein Wissen", "found": false}, {"type": "without", "string": "Thema: Fu\u00dfball", "found": false}]}
{"file": "surfguard.wordpress.com.medien.html", "url": "https://surfguard.wordpress.com/2016/11/01/ich-las-sah-hoerte-medien-im-oktober-2016/", "text_len": 5353, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Rudy Guede seinerzeit nat\u00fcrlich wahrgenommen", "found": true}, {"type": "with", "string": "Muss man gesehen haben. Augen\u00f6ffnend.", "found": true}, {"type": "with", "string": "Eine neue Platte von Wilco also", "found": true}, {"type": "without", "string": "Diesen Artikel teilen:", "found": false}, {"type": "without", "string": "\u00c4hnliche Beitr\u00e4ge", "found": false}, {"type": "without", "string": "Schreibe einen Kommentar: ", "found": false}]}
{"file": "healthline.com.fat.html", "url": "https://www.healthline.com/nutrition/ways-to-measure-body-fat", "text_len": 15778, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "It can be frustrating to step on the scale", "found": true}, {"type": "with", "string": "Skinfold measurements have been used to estimate", "found": true}, {"type": "with", "string": "Some methods, such as skinfold measurements, circumference", "found": true}, {"type": "without", "string": "to improve your health or lose weight, ", "found": false}, {"type": "without", "string": "\u00a9 2005-2020 Healthline Media a Red Ventures", "found": false}, {"type": "without", "string": "Filter out the noise and nurture your inbox", "found": false}]}
{"file": "Jest zgoda PE na umow\u0119 handlow\u0105 mi\u0119dzy UE a Londynem.html", "url": "https://wpolityce.pl/gospodarka/549052-jest-zgoda-pe-na-umowe-handlowa-miedzy-ue-a-londynem", "text_len": 2323, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Zgoda PE jest", "found": true}, {"type": "with", "string": "i otwiera now\u0105 er\u0119", "found": true}, {"type": "with", "string": "\u201ehistorycznym b\u0142\u0119dem\u201d", "found": true}, {"type": "without", "string": "opublikowano", "found": false}, {"type": "without", "string": "aja/PAP", "found": true}, {"type": "without", "string": "Czekamy na Wasze", "found": false}]}
{"file": "dw.com-elephants.html", "url": "https://www.dw.com/fr/la-perte-des-terres-fertiles-et-les-%C3%A9l%C3%A9phants-en-guin%C3%A9e-conakry/a-6533123", "text_len": 265, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "24 milliards de tonnes", "found": true}, {"type": "with", "string": "d\u00e9veloppement, IRD \u00e0 Dakar.", "found": true}, {"type": "with", "string": "d'une \u00e9tude men\u00e9e", "found": true}, {"type": "without", "string": "et vid\u00e9os sur le sujet", "found": false}, {"type": "without", "string": "terres fertiles et les \u00e9l\u00e9phants en Guin\u00e9e-Conakry", "found": false}, {"type": "without", "string": "Permalien", "found": false}]}
{"file": "orsted.de.gruener-Wasserstoff.html", "url": "https://orsted.de/gruene-energie/gruener-wasserstoff/potenzial", "text_len": 4063, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Das \u201eerneuerbare Molek\u00fcl\u201c:", "found": false}, {"type": "with", "string": "Wasserstoff als Energietr\u00e4ger", "found": true}, {"type": "with", "string": "E-Fuels als L\u00f6sung", "found": true}, {"type": "without", "string": "Folgen Sie uns auf", "found": false}, {"type": "without", "string": "\u00d8rsted glaubt an eine Welt", "found": false}, {"type": "without", "string": "Home", "found": false}]}
{"file": "uncutnews.ch-ID-Diktat.html", "url": "https://uncutnews.ch/digitale-id-diktat-un-und-gates-stiftung-setzen-auf-totale-kontrolle/", "text_len": 2954, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Im besten Fall sollen DPIs die Entwicklung auf vielf\u00e4ltige Weise f\u00f6rdern", "found": true}, {"type": "with", "string": "Kritiker, die jedoch hinter die Fassade aus Plattit\u00fcden", "found": true}, {"type": "with", "string": "entlarven den Begriff und die dahinterstehende Politik als Vorwand", "found": true}, {"type": "without", "string": "UNMANIPULIERTE & FREIE MEDIEN", "found": false}, {"type": "without", "string": "Wir werden nicht von Vereinen, Verb\u00e4nden, Parteien oder sonstigen Lobbygruppen unterst\u00fctzt.", "found": false}, {"type": "without", "string": "Wir schalten keine Werbung, wir bel\u00e4stigen auch nicht mit l\u00e4stigen Pop-ups oder n\u00f6tigen unsere Besucher", "found": false}]}
{"file": "careelite.de-flaechenverbrauch.html", "url": "https://www.careelite.de/flaechenverbrauch-fuer-fleisch/", "text_len": 0, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Du willst mehr \u00fcber den Fl\u00e4chenverbrauch f\u00fcr Fleisch,", "found": false}, {"type": "with", "string": "dessen Entwicklung vermitteln:", "found": false}, {"type": "with", "string": "Eine bemerkenswerte Statistik macht besonders", "found": false}, {"type": "without", "string": "Quellenangaben:", "found": false}, {"type": "without", "string": "richtig! Die Aufmerksamkeit", "found": false}, {"type": "without", "string": "NEUESTE BEITR\u00c4GE.", "found": false}]}
{"file": "report24.news-Drohne.html", "url": "https://report24.news/so-nah-kam-eine-iranische-drohne-einem-us-flugzeugtraeger/", "text_len": 1184, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wie das nachfolgende auf X verbreitete", "found": true}, {"type": "with", "string": "Video der iranischen Nachrichtenagentur", "found": true}, {"type": "with", "string": "Tasnim News verdeutlicht", "found": true}, {"type": "without", "string": "Neueste Artikel", "found": false}, {"type": "without", "string": "EHRUNG F\u00dcR WIDERST\u00c4NDIGE - JETZT BESTELLEN!", "found": false}, {"type": "without", "string": "JETZT VORSORGEN - SPAREN SIE BIS ZU 500 EURO!", "found": false}]}
{"file": "brigitte.de.ikigai.html", "url": "https://www.brigitte.de/liebe/persoenlichkeit/ikigai-macht-dich-sofort-gluecklicher--10972896.html", "text_len": 3000, "tp": 4, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Gl\u00fccks-Trend Konkurrenz", "found": true}, {"type": "with", "string": "Praktiziere Dankbarkeit", "found": true}, {"type": "with", "string": "dein Ikigai schon gefunden?", "found": true}, {"type": "with", "string": "14,90 Euro.", "found": true}, {"type": "without", "string": "Neu in Liebe", "found": false}, {"type": "without", "string": "Erfahre mehr", "found": false}, {"type": "without", "string": "Erfahrung mit privater Arbeitsvermittlung?", "found": false}]}
{"file": "brandenburg.de.homo-brandenburgensis.html", "url": "https://www.politische-bildung-brandenburg.de/themen/land-und-leute/homo-brandenburgensis", "text_len": 11496, "tp": 3, "fn": 0, "fp": 0, "tn": 5, "details": [{"type": "with", "string": "Stilles Rackern, statt lautem Deklamieren.", "found": true}, {"type": "with", "string": "Watt jibt\u2019s n hier zu lachen?", "found": true}, {"type": "with", "string": "Das Brandenbuch. Ein Land in Stichworten.", "found": true}, {"type": "without", "string": "B\u00fcrgerbeteiligung", "found": false}, {"type": "without", "string": "Anmelden", "found": false}, {"type": "without", "string": "Foto: Timur", "found": false}, {"type": "without", "string": "Schlagworte", "found": false}, {"type": "without", "string": "Zeilenumbr\u00fcche und Abs\u00e4tze werden automatisch erzeugt.", "found": false}]}
{"file": "denkmalpraxismoderne.de.studentendorf.html", "url": "https://denkmalpraxismoderne.de/studentendorf-schlachtensee-berlin/", "text_len": 2324, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Freie Universit\u00e4t Berlin, Land Berlin", "found": true}, {"type": "with", "string": "Erster Bauabschnitt: 21 ein- bis dreigeschossige", "found": true}, {"type": "with", "string": "Erstellung eines Parkpflegewerks von Uwe", "found": true}, {"type": "without", "string": "W\u00fcstenrot Stiftung", "found": true}, {"type": "without", "string": "Kanzlerbungalow Bonn", "found": false}, {"type": "without", "string": "Alle Sanierungsbeispiele", "found": false}]}
{"file": "giga.de.chrome.html", "url": "https://www.giga.de/downloads/google-chrome/tipps/google-chrome-exportieren-alle-daten-sichern-und-nichts-mehr-verlieren/", "text_len": 3217, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Es gibt zwei Methoden, mit denen ihr Google Chrome", "found": true}, {"type": "with", "string": "Google Chrome speichert alle benutzerrelevanten Daten,", "found": true}, {"type": "with", "string": "funktioniert - in eingeschr\u00e4nktem Ma\u00dfe - nat\u00fcrlich auch auf", "found": true}, {"type": "without", "string": "F\u00fcr Links auf dieser Seite erh\u00e4lt GIGA", "found": false}, {"type": "without", "string": "oder blauer Unterstreichung gekennzeichnete. Mehr Infos.", "found": false}, {"type": "without", "string": "Alle Rechte vorbehalten.", "found": false}]}
{"file": "spoe.at-mieterh\u00f6hung.html", "url": "https://www.spoe.at/2022/02/04/automatische-mieterhoehung-verhindern/", "text_len": 2827, "tp": 3, "fn": 0, "fp": 3, "tn": 0, "details": [{"type": "with", "string": "April zus\u00e4tzlich aufgrund einer", "found": true}, {"type": "with", "string": "das sind pro Jahr \u00fcber 500 Euro an Mehrkosten", "found": true}, {"type": "with", "string": "Wohnverh\u00e4ltnisse sollen als Ausnahme", "found": true}, {"type": "without", "string": "Wohnen", "found": true}, {"type": "without", "string": "nicht noch zus\u00e4tzlich", "found": true}, {"type": "without", "string": "Preise f\u00fcr das t\u00e4gliche", "found": true}]}
{"file": "Solarserver.de.solarthermisches kraftwerk dubai.html", "url": "https://www.solarserver.de/2022/12/01/groesstes-solarthermisches-kraftwerk-der-welt-entsteht-in-dubai/ ", "text_len": 2132, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Shanghai Electric baut", "found": false}, {"type": "with", "string": "Die PV-Module mit insgesamt 250", "found": true}, {"type": "with", "string": "F\u00fcr das Projekt werden etwa 560.000 Tonnen", "found": true}, {"type": "without", "string": "Solarserver Newsletter", "found": false}, {"type": "without", "string": "Solarserver Stellenmarkt", "found": false}, {"type": "without", "string": "teilen twittern E-Mail", "found": false}]}
{"file": "aussengedanken.de.feuerholz.html", "url": "http://www.aussengedanken.de/streit-ums-feuerholz/", "text_len": 8338, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Nur eine kurze Sandpiste", "found": true}, {"type": "with", "string": "Und nicht nur sie. Einige Hundert Kilometer", "found": true}, {"type": "with", "string": "Immerhin 1,6 Millionen Euro Hilfsgelder", "found": true}, {"type": "without", "string": "Schreibe einen Kommentar", "found": false}, {"type": "without", "string": "Lars Bauer (links im Bild) und Jens", "found": false}, {"type": "without", "string": "Unterst\u00fctzen Sie uns", "found": false}]}
{"file": "nature.com.telescope.html", "url": "https://www.nature.com/articles/d41586-019-02790-3", "text_len": 5814, "tp": 3, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "Since testing began", "found": true}, {"type": "with", "string": "Eye in the sky", "found": true}, {"type": "with", "string": "Li hopes that", "found": true}, {"type": "without", "string": "You are using a browser version", "found": false}, {"type": "without", "string": "PDF version", "found": false}, {"type": "without", "string": "Latest on:", "found": false}, {"type": "without", "string": "I agree my information will be", "found": false}]}
{"file": "handelsblatt.com.grenzschliessungen.html", "url": "https://www.handelsblatt.com/politik/international/grenzschliessungen-report-von-der-deutsch-franzoesischen-grenze-der-partner-wird-zum-fremden/25776812.html", "text_len": 13695, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wenn Helmut Kohl emotional wu", "found": true}, {"type": "with", "string": "en darf und vor allen Dingen nicht zwischen Deutschland und Frankreich.\u201c", "found": true}, {"type": "with", "string": "an der Grenze zu Frankreich ", "found": true}, {"type": "without", "string": "Jetzt weiterlesen", "found": false}, {"type": "without", "string": "Serviceangebote", "found": false}, {"type": "without", "string": "aktivieren", "found": false}]}
{"file": "herzundblut.com.Besuch.html", "url": "https://www.herzundblut.com/blog-1/kebbqe4kcwbrx62pr60i7gkd6mvlf7", "text_len": 5379, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In einer wundersch\u00f6nen Penthousewohnung", "found": true}, {"type": "with", "string": "Durch kulturelle Ausfl\u00fcge,", "found": true}, {"type": "with", "string": "Wie feiert es sich auf eurer 360", "found": true}, {"type": "without", "string": "Share", "found": false}, {"type": "without", "string": "Tags Homestory, Interior design, Berlin", "found": false}, {"type": "without", "string": "Everything i like..People, Photography, Interior", "found": false}]}
{"file": "ebrosia.de.zinfandel.html", "url": "https://www.ebrosia.de/beringer-zinfandel-rose-stone-cellars-lieblich-suess", "text_len": 3054, "tp": 4, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "Das Bukett pr\u00e4sentiert sich", "found": true}, {"type": "with", "string": "Besonders gut passt er zu asiatischen Gerichten", "found": true}, {"type": "with", "string": "Details zum Artikel", "found": true}, {"type": "with", "string": "Dekantieren nicht notwendig", "found": true}, {"type": "without", "string": "Kunden kauften auch", "found": false}, {"type": "without", "string": "Gutschein sichern", "found": false}, {"type": "without", "string": "wurde erfolgreich hinzugef\u00fcgt.", "found": false}, {"type": "without", "string": "Bitte geben Sie die Zahlenfolge", "found": false}]}
{"file": "shingon-reiki.de.schamanismus.html", "url": "http://www.shingon-reiki.de/reiki-und-schamanismus/", "text_len": 6222, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u795e\u9053", "found": true}, {"type": "with", "string": "War Mikao Usui Schamane?", "found": true}, {"type": "with", "string": "Reiki und Runen", "found": true}, {"type": "without", "string": "Hinterlasse eine Antwort", "found": false}, {"type": "without", "string": "Catch Evolution", "found": false}, {"type": "without", "string": "und gekennzeichnet mit", "found": false}]}
{"file": "mitundvoneinander.com-Fr\u00fchling.html", "url": "https://mitundvoneinander.wordpress.com/2008/12/31/ratschlage-geben/", "text_len": 811, "tp": 0, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "PDF:", "found": false}, {"type": "without", "string": "Teilen Sie dies mit", "found": false}, {"type": "without", "string": "Gib das erste", "found": false}, {"type": "without", "string": "Dezember", "found": false}]}
{"file": "eishockeynews.de-halbfinale.html", "url": "https://www.eishockeynews.de/aktuell/artikel/2022/02/01/zweimal-kuusela-im-powerplay-und-ein-konter-muenchen-verliert-bei-tappara-tampere-mit-0-3-und-verpasst-das-chl-endspiel/c90d406b-2b41-4e98-b9cd-4aa661e512b2.html", "text_len": 3564, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Tappara ging dabei bereits nach rund", "found": true}, {"type": "with", "string": "sowie die bessere Struktur. So", "found": true}, {"type": "with", "string": "Saison 2021/22 und damit den Nachfolger", "found": true}, {"type": "without", "string": "DAS K\u00d6NNTE SIE AUCH INTERESSIEREN", "found": false}, {"type": "without", "string": "Wenn du Zeit am Computer", "found": false}, {"type": "without", "string": "Schwenningen, Landshut oder", "found": false}]}
{"file": "biobiochile.cl-gremios.html", "url": "https://www.biobiochile.cl/noticias/nacional/region-de-los-rios/2022/05/04/gremios-de-los-camioneros-no-descartan-nueva-movilizacion-realizaran-consulta-nacional.shtml", "text_len": 5903, "tp": 0, "fn": 3, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "En este contexto, la tarde", "found": false}, {"type": "with", "string": "consulta que se har\u00e1 este jueves", "found": false}, {"type": "with", "string": "suma protecci\u00f3n a la infraestructura", "found": false}, {"type": "without", "string": "\"A ver si se atreve a viajar\":", "found": false}, {"type": "without", "string": "visto ahora", "found": true}, {"type": "without", "string": "Hector Andrade", "found": false}]}
{"file": "crazy-julia.de.tipps.html", "url": "https://crazy-julia.de/beauty-tipps-die-jede-braut-kennen-sollte/", "text_len": 3400, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "in keinem Braut-Beauty-Programm fehlen darf?", "found": true}, {"type": "with", "string": "nicht nur vor der Hochzeit ein absolutes Muss.", "found": true}, {"type": "with", "string": "Gesundes, gl\u00e4nzendes Haar", "found": true}, {"type": "without", "string": "Neue Wandbilder von Posterlounge", "found": false}, {"type": "without", "string": "mit meinen Texten und mit meinen Gedanken.", "found": false}, {"type": "without", "string": "Erforderliche Felder sind mit * markiert.", "found": false}]}
{"file": "uepo.de.glossar.html", "url": "https://uepo.de/2020/04/26/digitales-woerterbuch-der-deutschen-sprache-redaktion-erstellt-glossar-zur-corona-pandemie/", "text_len": 4961, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Weiterf\u00fchrender Link", "found": true}, {"type": "with", "string": "randenburgischen Akademie der Wissenschaften (BBAW) die in Presse und Medien bereits sichtb", "found": true}, {"type": "with", "string": "c) [Milit\u00e4r] Strategie f\u00fcr den geordneten Abzug eines Truppenkontingents aus dem Auslandseinsatz", "found": true}, {"type": "without", "string": "Twitter-Kurznachrichten", "found": false}, {"type": "without", "string": "Mehr zum Thema auf UEPO.de", "found": true}, {"type": "without", "string": "Das \u00dcbersetzerportal UEPO.de ist seit 2001 die Tagesschau der \u00dcbersetzungsbranche im ", "found": false}]}
{"file": "wiki.python.org.Download.html", "url": "https://wiki.python.org/moin/BeginnersGuide/Download", "text_len": 3057, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "hey are available via the yellow download buttons on that page. ", "found": false}, {"type": "with", "string": "Before you start, you will need Python on your computer.", "found": true}, {"type": "with", "string": "general download page", "found": true}, {"type": "without", "string": "Unable to edit the page? See the FrontPage for instructions.", "found": false}, {"type": "without", "string": "Attachments", "found": false}, {"type": "without", "string": "Login", "found": false}]}
{"file": "wolfgangmichal.de.sorgfaltspflicht.html", "url": "https://www.wolfgangmichal.de/2017/06/07/publizistische-sorgfaltspflicht-statt-netzwerkdurchsetzungsgesetz/", "text_len": 9923, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die Repr\u00e4sentanten der Republik sind nerv\u00f6s. ", "found": true}, {"type": "with", "string": "verkaufen, muss jedes Unternehmen in die Bredouille bringen.", "found": true}, {"type": "with", "string": "EU-Urheberrechts-Richtlinie sogar bindend vorgeschrieben werden.", "found": true}, {"type": "without", "string": "verteidigt sie ihre Linie gegen die Zumutungen der Moderne.", "found": false}, {"type": "without", "string": "verhindert, sondern zu Geld gemacht werden.", "found": false}, {"type": "without", "string": "den Rechtspopulisten mehr n\u00fctzen als schaden.", "found": false}]}
{"file": "archive.org.tv-orange.de.future.html", "url": "https://web.archive.org/web/20130217080612/http://tv-orange.de/2012/08/future-of-hope-island-befreit-sich-von-den-bankstern-der-film/", "text_len": 3723, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Dieser Film wird bislang von den Kontinental-Europ\u00e4ischen Medien", "found": true}, {"type": "with", "string": "Ein Beispiel von Selbstzensur, symptomatisch f\u00fcr die Haltung gef\u00e4lliger", "found": true}, {"type": "with", "string": "Au\u00dferdem verbreitet sich \u00fcber Facebook die Information \u00fcber", "found": true}, {"type": "without", "string": "Hiesige Medien schw\u00f6ren die Bev\u00f6lkerung auf Gedeih", "found": false}, {"type": "without", "string": "In den von den Banken verursachten Immobilienblasen und unsauberen", "found": false}, {"type": "without", "string": "Wir haben Gutwettermacher, Medienmacher, Meinungsmacher, Schlechtwettermacher, Schuhmacher", "found": true}]}
{"file": "msn.com.university.html", "url": "https://www.msn.com/en-gb/news/uknews/uk-university-student-halls-too-full-to-be-safe-experts-warn/ar-BB19DUqK", "text_len": 9951, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "s increasing numbers of UK universities wrestle with", "found": true}, {"type": "with", "string": "seven days. In Northern Ireland, call your GP.", "found": true}, {"type": "with", "string": "Some UK universities, including Cambridge, Imperial College London", "found": true}, {"type": "without", "string": "powered by Microsoft News", "found": false}, {"type": "without", "string": "Sign in", "found": false}, {"type": "without", "string": "Commenting is not currently available, but don\u2019t worry", "found": false}]}
{"file": "0a24692a9ea846c1819bd6a5f92a8874.html", "url": "https://www.watson.ch/leben/drinks/453207266-sazerac-alles-ueber-den-cocktail-klassiker-aus-new-orleans", "text_len": 6091, "tp": 3, "fn": 2, "fp": 1, "tn": 4, "details": [{"type": "with", "string": "wo man in Z\u00fcrich", "found": false}, {"type": "with", "string": "1-2 Spritzer Peychaud", "found": true}, {"type": "with", "string": "Aber eigentlich kommt es f\u00fcr den Privatgebrauch", "found": true}, {"type": "with", "string": "mit Schweizer Einschlag", "found": true}, {"type": "with", "string": "Storming the Sazerac", "found": false}, {"type": "without", "string": "auf Twitter", "found": false}, {"type": "without", "string": "Nachtmodus ein", "found": false}, {"type": "without", "string": "Warum Trump jetzt Syrien um die Ohren fliegt", "found": false}, {"type": "without", "string": "Shot Happens", "found": false}, {"type": "without", "string": "Geht man auf die Anf\u00e4nge", "found": true}]}
{"file": "alpin.de-freeride.html", "url": "https://www.alpin.de/sicher-am-berg/skitouren/51490/artikel_quantum-free-asolo-factory-130-das-beste-aus-der-touring-und-der-freeride-welt-vereint.html", "text_len": 1406, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Spitzenklasse, der das Beste", "found": false}, {"type": "with", "string": "Die zweiteilige X Dual", "found": true}, {"type": "with", "string": "Der exklusive IF Touring", "found": true}, {"type": "without", "string": "Quantum Free Asolo Factory 130:", "found": false}, {"type": "without", "string": "Besonders komfortable Innenschuhe", "found": false}, {"type": "without", "string": "Thema Skitouren:", "found": false}]}
{"file": "katzen-forum.net-Pepe.html", "url": "https://www.katzen-forum.net/threads/jede-nacht-verliert-pepe-soviel-dreck-aus-dem-fell.230143/", "text_len": 1740, "tp": 1, "fn": 2, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "auf seiner beigefarbenen", "found": true}, {"type": "with", "string": "(Vor allem die \"Bettelm\u00e4nner\", wenn", "found": false}, {"type": "with", "string": "schon seit 5 Uhr drau\u00dfen", "found": false}, {"type": "without", "string": "das wirklich Katzenfl\u00f6he!?", "found": false}, {"type": "without", "string": "\u00c4hnliche Themen", "found": false}, {"type": "without", "string": "Katzen Forum", "found": false}]}
{"file": "laola1.at-barisic.html", "url": "https://www.laola1.at/de/red/fussball/bundesliga/news/rapids-barisic-geschlaucht---dann-hau--ich-mein-handy-zam-/", "text_len": 4059, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Business wird immer schnelllebiger", "found": true}, {"type": "with", "string": "Kampfmannschaft gekommen sind, die aus unserer Akademie", "found": true}, {"type": "with", "string": "Die Corona-Pandemie sorgt nicht nur f\u00fcr sportliche", "found": true}, {"type": "without", "string": "Status quo: Das passiert noch beim SK Rapid", "found": false}, {"type": "without", "string": "Action! Anna Gasser im Olympia-Interview", "found": false}, {"type": "without", "string": "WAC: \"Handschrift von Dutt verinnerlicht\"", "found": false}]}
{"file": "observer.com-LVMH.html", "url": "https://observer.com/2023/11/bernard-arnault-lvmh-louvre-chardin/", "text_len": 3644, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "For over a year, the Louvre has fought to acquire", "found": true}, {"type": "with", "string": "an 18th-century painting by Jean Sim\u00e9on Chardin for its national collection", "found": true}, {"type": "with", "string": "Now, the museum is receiving help in the form of 15 million euros", "found": true}, {"type": "without", "string": "Advertising Guidelines", "found": false}, {"type": "without", "string": "Editorial Ethics", "found": false}, {"type": "without", "string": "Do not sell my data", "found": false}]}
{"file": "der-erfolg-gibt-recht.de.rinderleber.html", "url": "http://www.der-erfolg-gibt-recht.de/rezepte/rinderleber-geschnetzeltes-mit-apfel-und-zwiebel.htm", "text_len": 1555, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "So sch\u00f6n winterlich ist es wie", "found": false}, {"type": "with", "string": "Und wie (fast) immer bei uns", "found": true}, {"type": "with", "string": "Dazu gab es bei uns selbst gemachten", "found": true}, {"type": "without", "string": "\u00a9 Liebe geht durch den Magen", "found": false}, {"type": "without", "string": "Holen Sie sich Ihre \u201eKostprobe\u201c", "found": false}, {"type": "without", "string": "Be Sociable, Share!", "found": false}]}
{"file": "francais.radio.cz-ministre.html", "url": "https://francais.radio.cz/le-ministre-de-la-sante-surpris-sans-masque-au-restaurant-8698000", "text_len": 5221, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "savoir qu'il lui cherchait", "found": true}, {"type": "with", "string": "Andrej Babi\u0161 a \u00e9galement", "found": true}, {"type": "with", "string": "de la Sant\u00e9 avait", "found": true}, {"type": "without", "string": "ARTICLES CORRESPONDANTS", "found": false}, {"type": "without", "string": "Pour faire face \u00e0 l\u2019\u00e9pid\u00e9mie", "found": false}, {"type": "without", "string": "Roman Prymula, photo:", "found": false}]}
{"file": "piratenpartei.at.grundeinkommen.html", "url": "https://www.piratenpartei.at/volksbegehren-zum-bedingungslosen-grundeinkommen-bge/", "text_len": 5580, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Aktuell liegt beim Innenministerium ein Volksbegehren", "found": true}, {"type": "with", "string": "Jetzt w\u00e4re der richtige Zeitpunkt", "found": true}, {"type": "with", "string": "Durch die aktuelle wirtschaftliche Hochlage ", "found": true}, {"type": "without", "string": "Please reload CAPTCHA.", "found": false}, {"type": "without", "string": "Theme based on the great work", "found": false}, {"type": "without", "string": "Getaggt mit", "found": false}]}
{"file": "creativecommons.ch.wie.html", "url": "http://www.creativecommons.ch/wie-funktionierts/", "text_len": 4555, "tp": 3, "fn": 0, "fp": 1, "tn": 1, "details": [{"type": "with", "string": "Sie k\u00f6nnen selber bestimmen", "found": true}, {"type": "with", "string": "Die Bedeutungen der Lizenzen", "found": true}, {"type": "with", "string": "Der durchgestrichene Dollar bedeutet", "found": true}, {"type": "without", "string": "Sofern nicht anders ausgewiesen", "found": true}, {"type": "without", "string": "Designed by Elegant Themes", "found": false}]}
{"file": "whiskyverkostung.com.halle.html", "url": "https://www.whiskyverkostung.com/termine-whisky-tastings-januar-mai-2020-halle-saale/5805", "text_len": 2200, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Auch im Jahr 2020 wird", "found": true}, {"type": "with", "string": "Termin: 29.02.2020, 19 Uhr", "found": true}, {"type": "with", "string": "Whikies aus verschiedenen Regionen Schottlands ", "found": true}, {"type": "without", "string": "Info & Anmeldungen", "found": false}, {"type": "without", "string": "Copyright \u00a9 2020 by: whiskyverkostung.com", "found": false}, {"type": "without", "string": "Der Beitrag wurde am Mittwoch", "found": false}]}
{"file": "selbst.de-wurmkiste.html", "url": "https://www.selbst.de/wurmkiste-39572.html", "text_len": 2376, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "kompostieren. In einer Wurmkiste", "found": true}, {"type": "with", "string": "foetida Kartoffelschalen oder Kaffeesatz", "found": true}, {"type": "with", "string": "Nachdem der Abfall in der obersten", "found": true}, {"type": "without", "string": "Selbst.de empfiehlt", "found": false}, {"type": "without", "string": "Mehr zum Thema", "found": false}, {"type": "without", "string": "Einfach", "found": true}]}
{"file": "rutgers.edu.robot.html", "url": "https://www.rutgers.edu/news/new-robot-does-superior-job-sampling-blood", "text_len": 3159, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "First clinical trial of an automated blood drawing and testing device", "found": true}, {"type": "with", "string": "nefiting patients and healthcare workers alike.", "found": true}, {"type": "with", "string": "from this study will be used to enhance artificial intelligence in the robot to improve its performance.", "found": true}, {"type": "without", "string": "You May Also Like", "found": false}, {"type": "without", "string": "University Operating Status", "found": false}, {"type": "without", "string": "ng. The university has move", "found": false}]}
{"file": "evang.at-lockdown.html", "url": "https://evang.at/lockdown-gottesdienste-bleiben-unter-strengen-auflagen-moeglich/", "text_len": 2305, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "in Pfarrgemeinden sollen als", "found": true}, {"type": "with", "string": "seien alle Presbyterien dringend", "found": true}, {"type": "with", "string": "Mit Verweis auf den Lockdown", "found": true}, {"type": "without", "string": "Foto: ccnull/Marco", "found": false}, {"type": "without", "string": "Aus dem Evangelium", "found": false}, {"type": "without", "string": "theologiebed\u00fcrftig", "found": false}]}
{"file": "geeks3d.com.hacklab.html", "url": "https://www.geeks3d.com/hacklab/20190110/python-3-simple-http-request-with-the-socket-module/", "text_len": 1782, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "This module provides access to the BSD socket interface", "found": true}, {"type": "with", "string": "Host:www.google.com", "found": true}, {"type": "with", "string": "http_response_len = len(http_response)", "found": true}, {"type": "without", "string": "(Demo) APP Launcher", "found": false}, {"type": "without", "string": "Demos: geexlab-demopack-python3/socket/01-socket-http-request/main.xml", "found": false}, {"type": "without", "string": "Your email address will not be published", "found": false}]}
{"file": "feuerwehrverband.de-vorbereitungstagung.html", "url": "https://www.feuerwehrverband.de/dfv-auf-der-vorbereitungstagung-der-interkulturellen-woche/", "text_len": 529, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "bundesweite Vorbereitungstagung der Interkulturellen", "found": true}, {"type": "with", "string": "Faktor 112", "found": true}, {"type": "with", "string": "Die eigentliche Interkulturelle Woche", "found": true}, {"type": "without", "string": "DFV-Experte Carsten Schneider", "found": false}, {"type": "without", "string": "Nach Anmeldung geht mir eine E-Mail", "found": false}, {"type": "without", "string": "Beitrag teilen", "found": false}]}
{"file": "vipflash.de-Ehezoff.html", "url": "https://vipflash.de/contents/176739-ehezoff-der-pochers-eskaliert-jetzt-schiesst-olli-gegen-amira-und-ihren-neuen?locale=en", "text_len": 1486, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Oliver Pocher sieht die Dinge jedoch anders und \u00e4u\u00dfert sich recht deutlich", "found": true}, {"type": "with", "string": "Exclusiv Weekend Spezial: Die Stars im NFL-Fieber", "found": true}, {"type": "with", "string": "sagt Pocher in einem Live-Interview mit Moderatorin Frauke Ludowig", "found": true}, {"type": "without", "string": "Blaulicht", "found": false}, {"type": "without", "string": "Datenschutz", "found": false}, {"type": "without", "string": "Kontakt", "found": false}]}
{"file": "digitale-exzellenz.de.gesundheitswesen.html", "url": "https://www.digitale-exzellenz.de/ki-china-teil-2-wie-das-fernost-facebook-das-gesundheitswesen-revolutioniert/", "text_len": 8355, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Nach einem Einblick in zwei k\u00fcnstlich intelligente Sicherheitsprojekt", "found": true}, {"type": "with", "string": "Chinas medizinische Versorgung ist, salopp gesagt, verbesserungsw\u00fcrdig: wenig ", "found": true}, {"type": "with", "string": "Weitere genutzte Quellen in englischer und chinesischer Sprache:", "found": true}, {"type": "without", "string": "Empfohlene Beitr\u00e4ge", "found": true}, {"type": "without", "string": "Schreibe einen Kommentar ", "found": false}, {"type": "without", "string": "Process Mining und Verhaltensvielfalt miteinander", "found": true}]}
{"file": "hejfish.com-stephan.html", "url": "https://fischerhuette.hejfish.com/anglertalk-mit-stephan-hoeferer/", "text_len": 3033, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Zudem produziere er eigenst\u00e4ndige", "found": true}, {"type": "with", "string": "gibt es keine Angelpause im Jahr", "found": true}, {"type": "with", "string": "Ich liebe meine Brandenburger Gew\u00e4sser in ihrer", "found": true}, {"type": "without", "string": "Schreibe einen Kommentar", "found": false}, {"type": "without", "string": "Das k\u00f6nnte dich auch interessieren:", "found": false}, {"type": "without", "string": "Anglertalk mit", "found": false}]}
{"file": "boxen1.com-ring-r\u00fcckkehr.html", "url": "https://www.boxen1.com/morgen-abend-chris-eubank-jr-mit-ring-rueckkehr-gegen-liam-williams-60586/", "text_len": 1669, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Wochenende wieder in den Ring. Der", "found": true}, {"type": "with", "string": "\u201eGegen mich wird er den Schlussgong", "found": true}, {"type": "with", "string": "Monaten offizieller Pflichtherausforderer.", "found": true}, {"type": "without", "string": "BOXEN1-Award: Das sind Boxer, Boxerin,", "found": false}, {"type": "without", "string": "Promoter des Jahres 2021", "found": false}, {"type": "without", "string": "Chris Eubank Jr.", "found": true}]}
{"file": "cicero.de.pandemie.html", "url": "https://www.cicero.de/innenpolitik/corona-pandemie-es-kommt-auch-darauf-an-wie-die-menschen-sterben", "text_len": 9435, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Intensivbehandlung geht oder palliativ behandelt wird, ist ja die Patientenverf\u00fcgung.", "found": true}, {"type": "with", "string": "Wurde eine unn\u00f6tige Einweisung ins Krankenhaus verhindert?", "found": true}, {"type": "with", "string": "bei der Frage, wie wir die Krise bew\u00e4ltigen, nicht das einzige Kriterium sein kann", "found": true}, {"type": "without", "string": "Cicero Newsletter", "found": false}, {"type": "without", "string": "Moritz Gathmann leitet", "found": false}, {"type": "without", "string": "Sie sind leider nicht angemeldet", "found": false}]}
{"file": "antary.de.wireshark.html", "url": "https://www.antary.de/2017/06/29/wireshark-besuchte-urls-anzeigen-http-und-https/", "text_len": 4677, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wireshark m\u00f6glich ist, alle aufgerufenen", "found": true}, {"type": "with", "string": "Paketmitschnitt und eine aktuelle Version von Wireshark voraus. Beim", "found": true}, {"type": "with", "string": "angezeigt werden, was meiner Meinung nach komfortabler ist.", "found": true}, {"type": "without", "string": "Mit der Nutzung dieses Formulars erkl\u00e4rst du dich mit der Speicherung", "found": false}, {"type": "without", "string": "\u00dcber ein Geschenk von meine", "found": false}, {"type": "without", "string": "mich \u00fcber nachfolgende Kommentare per E-Mail.", "found": false}]}
{"file": "herrpfleger.de.fuelcell.html", "url": "https://herrpfleger.de/2019/10/new-balance-fuelcell-echo-bringt-speed/", "text_len": 715, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die FuelCell-Familie", "found": true}, {"type": "with", "string": "Das Retro-Design ist auf", "found": true}, {"type": "with", "string": "Mehr Infos auch auf der", "found": true}, {"type": "without", "string": "Medizinstudent, Papa, (ehemaliger)", "found": false}, {"type": "without", "string": "\u00dcber den Autor", "found": false}, {"type": "without", "string": "Schreib einen Kommentar", "found": false}]}
{"file": "verivox.de.finanzierung.html", "url": "https://www.verivox.de/kredit/leasing-oder-finanzierung/", "text_len": 8018, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "In diesem Ratgeber finden Sie Rechenbeis", "found": true}, {"type": "with", "string": "kann als Barzahler auftreten und einen Rabatt aushandeln.", "found": true}, {"type": "with", "string": "Die Drei-Wege-, Ballon- bzw. Vario-Finanzierung", "found": true}, {"type": "without", "string": "sachlich und geduldig", "found": false}, {"type": "without", "string": "Der Verivox-Newsletter", "found": false}, {"type": "without", "string": "in den Bereichen Energie, Telekommunikation, Versicherungen", "found": false}]}
{"file": "scinexx.com.ammoniak.html", "url": "https://www.scinexx.de/news/energie/ammoniak-spaltung-durch-leds-statt-hitze/", "text_len": 4730, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wegbereiter zu \u201egr\u00fcnem\u201c Wasserstoff?", "found": true}, {"type": "with", "string": "Eine g\u00fcnstigere Alternative", "found": true}, {"type": "with", "string": "\u201eDies ist der erste Bericht in der Fachliteratur,", "found": true}, {"type": "without", "string": "Zur\u00fcck zur Startseite", "found": false}, {"type": "without", "string": "Das k\u00f6nnte Sie auch interessieren", "found": false}, {"type": "without", "string": "In den Schlagzeilen", "found": false}]}
{"file": "jodel.com.advertising.html", "url": "https://advertising.jodel.com/", "text_len": 2251, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Was sorgt daf\u00fcr, dass deine Marke auf Jodel sicher ist?", "found": true}, {"type": "with", "string": "Visuelle und Text-Posts werden in einer 2. Stufe", "found": true}, {"type": "with", "string": "Lass dich inspirieren und starte deine Erfolgsgeschichte heute", "found": true}, {"type": "without", "string": "Welche Unternehmen bereits Jodel vertrauen", "found": false}, {"type": "without", "string": "Termin w\u00e4hlen", "found": false}, {"type": "without", "string": "All Rights Reserved.", "found": false}]}
{"file": "simplyscience.ch.erdoel.html", "url": "http://www.simplyscience.ch/teens-liesnach-archiv/articles/wie-entsteht-erdoel.html", "text_len": 2570, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Erd\u00f6l bildet nach Millionen", "found": true}, {"type": "with", "string": "Plankton zersetzt sich", "found": true}, {"type": "with", "string": "in unserem Artikel \"Warum wird das Erd\u00f6l knapp?\".", "found": true}, {"type": "without", "string": "TebNad/Shutterstock.com", "found": false}, {"type": "without", "string": "Empfiehl dies deinen Freunden.", "found": false}, {"type": "without", "string": "Die Natur ist aus chemischen Elementen aufgebaut", "found": false}]}
{"file": "d42c68f1b0f4408b81cf8f00bbe1a631.html", "url": "https://www.nzz.ch/international/der-nervenkrieg-um-den-brexit-geht-in-die-naechste-runde-ld.1516516", "text_len": 3320, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "eine Brexit-Verschiebung bei der EU beantragt", "found": true}, {"type": "with", "string": "\u00fcber den EU-Austritt Grossbritanniens gebracht. Eine Mehrheit ", "found": true}, {"type": "with", "string": "Dies k\u00f6nnte aus ihrer Sicht als Ersatz f\u00fcr den Grundsatzentscheid vom Samstag herhalten", "found": true}, {"type": "without", "string": "Niederlage f\u00fcr Boris Johnson \u2013 Britische Regierung will Brexit-Verschiebung beantragen", "found": false}, {"type": "without", "string": "Wagen Sie den anderen Blick mit unlimitiertem Zugang zur digitalen NZZ", "found": false}, {"type": "without", "string": "Haben Sie schon ein Benutzerkonto?", "found": false}]}
{"file": "sciencesetavenir.fr.rumeur.html", "url": "https://www.sciencesetavenir.fr/sante/covid-19-et-infox-comment-une-rumeur-devient-realite_147359", "text_len": 5704, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Aussi contagieuses que le virus ?", "found": true}, {"type": "with", "string": "contagieux (et potentiellement dangereux) que le SARS-CoV-2.", "found": true}, {"type": "with", "string": "popularit\u00e9 du sujet a explos\u00e9 suite \u00e0 ce", "found": true}, {"type": "without", "string": "L\u2019essentiel sant\u00e9", "found": false}, {"type": "without", "string": "A d\u00e9couvrir sur Challenges", "found": false}, {"type": "without", "string": "En images", "found": false}]}
{"file": "exlibris-deg.de.balsamo.html", "url": "http://www.exlibris-deg.de/2019/10/24/balsamo-stella-guido/", "text_len": 26336, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "M. Akt mit Axt einen Baum f\u00e4llend; Rem", "found": true}, {"type": "with", "string": "Adler nach Klippe, nach links blickend, Schooner im", "found": true}, {"type": "with", "string": "Exlibrissammlung PALMIRANI, Remo: Guido Balsamo Stella", "found": false}, {"type": "without", "string": "Winkler, Eduard", "found": false}, {"type": "without", "string": "Rechtliches", "found": false}, {"type": "without", "string": "German", "found": false}]}
{"file": "propellets.at.energie.html", "url": "https://www.propellets.at/soziale-energie", "text_len": 4824, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Besonders f\u00fcr Haushalte mit geringem Einkommen stellen steigende", "found": true}, {"type": "with", "string": "Ziel der vorliegenden Studie war es, zu kl\u00e4ren ob", "found": true}, {"type": "with", "string": "hohen Anfangsinvestition von rund 2700 \u20ac schwer erschwinglich.", "found": true}, {"type": "without", "string": "Newsletter", "found": false}, {"type": "without", "string": "teilen", "found": false}, {"type": "without", "string": "Alles \u00fcber den Verein", "found": false}]}
{"file": "wsl.ch-neubeau.html", "url": "https://neubau.wsl.ch/de/index.html", "text_len": 1450, "tp": 1, "fn": 0, "fp": 0, "tn": 1, "details": [{"type": "with", "string": "in der Grundlagenforschung t\u00e4tig und stellt", "found": true}, {"type": "without", "string": "Schachbrett", "found": false}]}
{"file": "xinhuanet.com.c_1125597921.html", "url": "http://www.xinhuanet.com/local/2020-02/19/c_1125597921.htm", "text_len": 1070, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "2\u670817\u65e5", "found": true}, {"type": "with", "string": "\u80fd\u8fc7\u5173\u3002", "found": true}, {"type": "with", "string": "\u8427\u6d77\u5ddd", "found": true}, {"type": "without", "string": "\u7ea0\u9519", "found": false}, {"type": "without", "string": "\u5173\u6ce8\u65b0\u534e\u7f51", "found": false}, {"type": "without", "string": "\u534a\u6708\u8c08", "found": false}]}
{"file": "schlosswirtjuval.it.geschichte.html", "url": "http://www.schlosswirtjuval.it/hof-geschichte/", "text_len": 6197, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Leider war dies nicht von langer Dauer, denn bereits 1581", "found": true}, {"type": "with", "string": "Den M\u00f6glichkeiten des Kommunikationszeitalters setzt er sein Unterwegssein", "found": true}, {"type": "with", "string": "alle 6 bis 14-j\u00e4hrigen Kinder der Juvaler H\u00f6fe zum Unterricht", "found": true}, {"type": "without", "string": "Messner Mountain Museum Juval", "found": false}, {"type": "without", "string": "+39 389 1976362 info@schlosswirtjuval.it", "found": false}, {"type": "without", "string": "Weingut & Hofbrennerei Unterortl", "found": false}]}
{"file": "dobszay.ch.geheimdiensten.html", "url": "https://www.dobszay.ch/2016-04-15/was-ist-der-unterschied-zwischen-privaten-und-staatlichen-geheimdiensten/", "text_len": 2482, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Die massenmediale Berichterstattung", "found": true}, {"type": "with", "string": "Seit vor allem das FBI Druck auf die Anbieter macht", "found": true}, {"type": "with", "string": "\u201eBellende Hunde beissen nicht\u201c ", "found": true}, {"type": "without", "string": "Stichwort-Wolke", "found": false}, {"type": "without", "string": "einige Rechte vorbehalten", "found": false}, {"type": "without", "string": "Neueste Beitr\u00e4ge", "found": false}]}
{"file": "ohneq.de.johannes.html", "url": "http://ohneq.de/ohneq/johannes/", "text_len": 668, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Mein Name ist Johannes aka ohneQ", "found": true}, {"type": "with", "string": "teile unsere Beitr\u00e4ge auf Facebook oder Twitter", "found": true}, {"type": "with", "string": "wenn Dir unsere Podcasts gefallen", "found": true}, {"type": "without", "string": "(c) Johannes Wolf", "found": false}, {"type": "without", "string": "Neueste Beitr\u00e4ge", "found": false}, {"type": "without", "string": "Akte Aurora", "found": false}]}
{"file": "frau-sabienes.de.konsumsparen.html", "url": "https://frau-sabienes.de/konsumsparen-fazit/", "text_len": 6986, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Das Jahr 2019 stand", "found": true}, {"type": "with", "string": "Ich werde also weiterhin meinen Konsum einschr\u00e4nken", "found": true}, {"type": "with", "string": "Ich bin gerade am \u00dcberlegen", "found": true}, {"type": "without", "string": "Inzwischen ganze 60", "found": false}, {"type": "without", "string": "Hier bin ich auch noch unterwegs", "found": false}, {"type": "without", "string": "Vorschau auf den n\u00e4chsten Artikel", "found": true}]}
{"file": "royalroad.com.melas.html", "url": "https://www.royalroad.com/fiction/34798/melas/chapter/535107/chapter-1-prologue-murdered", "text_len": 12233, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "When I woke up, there was nothing.", "found": true}, {"type": "with", "string": "If it was limited to my birth, I", "found": true}, {"type": "with", "string": "Make me the most powerful spellcaster, or whatever", "found": true}, {"type": "without", "string": "Royal Road\u00ae is the home of web novels", "found": false}, {"type": "without", "string": "Royal Road\u00ae \u00a9 2013-2020, background by", "found": false}, {"type": "without", "string": "advertising fees by advertising and linking to amazon.com.", "found": false}]}
{"file": "toptal.com.python.html", "url": "https://www.toptal.com/python/top-10-mistakes-that-python-programmers-make", "text_len": 17562, "tp": 5, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "and code reuse.", "found": true}, {"type": "with", "string": "bar is optional", "found": true}, {"type": "with", "string": "What the $%#!&??", "found": true}, {"type": "with", "string": "And you then tried to do", "found": true}, {"type": "with", "string": "Familiarizing oneself with the key", "found": true}, {"type": "without", "string": "Martin has worked as", "found": false}, {"type": "without", "string": "delivered weekly.", "found": false}, {"type": "without", "string": "MCMC Methods:", "found": false}]}
{"file": "0b5db24739704283849ca3ed20ce09d4.html", "url": "https://www.rundschau-online.de/region/rhein-berg/bergischgladbach/pflaster-desaster-gladbacher-fussgaengerzone-in-schlechtem-zustand-33335514", "text_len": 3030, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "An manchen Stellen wirkt das Stra\u00dfenpflaster deutlich in die Jahre gekommen.", "found": true}, {"type": "with", "string": "\u201eWir h\u00e4tten es auch lieber anders, aber das Ver", "found": true}, {"type": "with", "string": "Auf den Zeitrahmen des Verfahrens habe die Stadt allerdings keinen Einfluss.", "found": true}, {"type": "without", "string": "Weitere interessante News", "found": false}, {"type": "without", "string": "Aktuelle Artikel", "found": false}, {"type": "without", "string": "damit die Stadt in einem Gerichtsverfahren Indizien vorlegen", "found": true}]}
{"file": "Unijne fundusze coraz bli\u017cej. Sejm zag\u0142osowa\u0142 _za_ - Polityka - rp.pl.html", "url": "https://www.rp.pl/Polityka/305049888-Unijne-fundusze-coraz-blizej-Sejm-zaglosowal-za.html", "text_len": 3854, "tp": 1, "fn": 2, "fp": 0, "tn": 5, "details": [{"type": "with", "string": "To jest moment fundamentalny", "found": true}, {"type": "with", "string": "Ci\u0119\u017car dyskusji przeniesie", "found": false}, {"type": "with", "string": "Na lepsz\u0105 konkurencyjno\u015b\u0107 gospodarki", "found": false}, {"type": "without", "string": "Licencja na publikacj\u0119", "found": false}, {"type": "without", "string": "Reklama", "found": false}, {"type": "without", "string": "Dowiedz si\u0119 wi\u0119cej", "found": false}, {"type": "without", "string": "Rafa\u0142 Guz", "found": false}, {"type": "without", "string": "Publikacja:", "found": false}]}
{"file": "diakonie.de-Lebensgef\u00fchl.html", "url": "https://www.diakonie.de/pressemeldungen/vorstellung-der-studie-lebensgefuehl-corona", "text_len": 2344, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Lebensgef\u00fchl der Menschen", "found": true}, {"type": "with", "string": "ist eine Studie der Evangelischen", "found": true}, {"type": "with", "string": "Online-Pressekonferenz", "found": true}, {"type": "without", "string": "Kathrin Klinkusch", "found": false}, {"type": "without", "string": "Hermann Bredehorst", "found": false}, {"type": "without", "string": "und Berufe bei der Diakonie", "found": false}]}
{"file": "gdp.de-Wertsch\u00e4tzung.html", "url": "https://www.gdp.de/gdp/gdp.nsf/id/DE_GdP-Vize-Klemmer-Mangelnde-Wertschaetzung-fuer-die-Beschaeftigten-des-oeD?open&ccm=000", "text_len": 1643, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Potsdam die bisherige Sprachlosigkeit", "found": false}, {"type": "with", "string": "Verhandlungsort wollen am", "found": true}, {"type": "with", "string": "5 Prozent, mindestens", "found": true}, {"type": "without", "string": "GdP L\u00e4nder & Bezirke", "found": false}, {"type": "without", "string": "GdP App 2.0", "found": false}, {"type": "without", "string": "Foto: GdP/Hagen Immel", "found": false}]}
{"file": "badische-zeitung.de-Wohnungssuche.html", "url": "https://www.badische-zeitung.de/viele-studierende-sind-noch-verzweifelt-auf-wohnungssuche-in-freiburg", "text_len": 279, "tp": 0, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Gesine aus T\u00fcbingen l\u00e4uft die Zeit davon", "found": false}, {"type": "with", "string": "Die 18-J\u00e4hrige hat sich", "found": false}, {"type": "with", "string": "an der Uni Freiburg f\u00fcr ein Jurastudium eingeschrieben", "found": false}, {"type": "without", "string": "Weitere Artikel", "found": false}, {"type": "without", "string": "Abonnement hier k\u00fcndigen", "found": false}, {"type": "without", "string": "Kinder helfen Kindern", "found": false}]}
{"file": "threatpost.com.android.html", "url": "https://threatpost.com/android-ransomware-spreads-via-sex-simulation-game-links-on-reddit-sms/146774/", "text_len": 3668, "tp": 2, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "These messages include links to the ransomware", "found": true}, {"type": "with", "string": "using novel techniques to exfiltrate data.", "found": true}, {"type": "without", "string": "Share this article:", "found": false}, {"type": "without", "string": "Write a comment", "found": false}, {"type": "without", "string": "Notify me when new comments are added.", "found": false}, {"type": "without", "string": "uses Akismet to reduce spam.", "found": false}]}
{"file": "colours-of-the-soul.alhelm.net.html", "url": "http://www.colours-of-the-soul.alhelm.net", "text_len": 13185, "tp": 2, "fn": 1, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Einen Paralel-Scan", "found": true}, {"type": "with", "string": "1 Projektfahrplan-Brosch\u00fcre", "found": true}, {"type": "with", "string": "Aber es gibt noch den Sinn", "found": false}, {"type": "without", "string": "ein Buch-Gewinn", "found": false}, {"type": "without", "string": "Dann w\u00fcrde ich mich dar\u00fcber ", "found": false}]}
{"file": "0a12df42d1764095989ab078ee0f940b.html", "url": "https://www.zeit.de/2019/43/klimaschutz-banken-unternehmen-fracking-oelfoerderung-fossile-brennstoffe", "text_len": 936, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Weltweit finanzieren Banken und Investoren Unternehmungen", "found": true}, {"type": "with", "string": "wollten damit vor zwei Wochen die Verbindung zwischen der Wall Street", "found": true}, {"type": "with", "string": "JPMorgan Chase", "found": true}, {"type": "without", "string": "Bundesstaat Pennsylvania", "found": false}, {"type": "without", "string": "W\u00e4hlen Sie Ihren Zugang und lesen Sie weiter:", "found": false}, {"type": "without", "string": "Cookies & Tracking", "found": false}]}
{"file": "nymag.com.polarization.html", "url": "https://nymag.com/intelligencer/2020/05/polarization-republicans-democracy-ezra-klein-book-review.html", "text_len": 24349, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Which is to say, why was a solipsistic reality", "found": true}, {"type": "with", "string": "of its contradictions. As African-Americans migrated North in", "found": true}, {"type": "with", "string": "truth that our own identities are preventing", "found": true}, {"type": "without", "string": "This site is protected by reCAPTCHA and the Googl", "found": false}, {"type": "without", "string": "Daily news about the politics, business, and technolog", "found": false}, {"type": "without", "string": "\u00a9 2020 Vox Media, LLC. All rights reserved.", "found": false}]}
{"file": "Rosjanie sugeruj\u0105 natychmiastowe odci\u0119cie Polski od gazu - Energetyka24.html", "url": "https://energetyka24.com/rosjanie-sugeruja-natychmiastowe-odciecie-polski-od-gazu", "text_len": 3019, "tp": 3, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "Rosjanie twierdz\u0105, \u017ce z", "found": true}, {"type": "with", "string": "Dani\u0119 do Polski.", "found": true}, {"type": "with", "string": "konkluduje finobzor.ru.", "found": true}, {"type": "without", "string": "ZOBACZ TAK\u017bE", "found": false}, {"type": "without", "string": "Reklama", "found": false}, {"type": "without", "string": "Prosimy o zaznaczenie", "found": false}, {"type": "without", "string": "Czy\u017cewski", "found": false}]}
{"file": "madymorrsion.com.energy.html", "url": "https://www.madymorrison.com/yoga/energy-rising", "text_len": 2623, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Der Fr\u00fchling steht bevor,", "found": true}, {"type": "with", "string": "F\u00fcr die Energy Rising \u2013 Challenge nutzen wir", "found": true}, {"type": "with", "string": "Nun w\u00fcnsch ich dir aber ganz viel Spa\u00df", "found": true}, {"type": "without", "string": "YOU MAY ALSO LIKE", "found": false}, {"type": "without", "string": "YOGA", "found": true}, {"type": "without", "string": "FOOD", "found": false}]}
{"file": "telegraph.co.uk.plumber.html", "url": "https://www.telegraph.co.uk/news/uknews/law-and-order/9209302/Plumber-jailed-after-boiler-killed-millionaires-daughter.html", "text_len": 4221, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "The deadly fumes leaked out of the dodgy boiler flue pipe", "found": true}, {"type": "with", "string": "The quality of work fell below your normal high standards", "found": true}, {"type": "with", "string": "sobbed in court as Hartley was led to begin his sentence", "found": true}, {"type": "without", "string": "More stories", "found": false}, {"type": "without", "string": "2:54pm", "found": false}, {"type": "without", "string": "Follow us on", "found": false}]}
{"file": "mein-haustier.de-hund.html", "url": "https://www.mein-haustier.de/hund/eat-small/", "text_len": 4171, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Nachhaltigkeit ist heutzutage ein wichtiges Thema", "found": true}, {"type": "with", "string": "Ressourcen ben\u00f6tigen, sind sie", "found": true}, {"type": "with", "string": "Alleinfutter f\u00fcr alle etwas ruhigeren Hunde", "found": true}, {"type": "without", "string": "Energy Snack", "found": true}, {"type": "without", "string": "\u00c4hnliche Artikel", "found": false}, {"type": "without", "string": "WALD Nassfutter", "found": true}]}
{"file": "neos.eu.wir.html", "url": "https://www.neos.eu/wir-sind-neos", "text_len": 2575, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Wir NEOS stehen seit 2012 f\u00fcr ein Neues \u00d6sterreich", "found": true}, {"type": "with", "string": "Seit dem Bestehen von NEOS mussten wir ein paar Verluste", "found": true}, {"type": "with", "string": "Demokratie braucht Parteien, die transparent", "found": true}, {"type": "without", "string": "Erfahre mehr", "found": false}, {"type": "without", "string": "Ich stimme der elektronischen Verarbeitung", "found": false}, {"type": "without", "string": "Folge uns", "found": false}]}
{"file": "bbc.com.52241221.html", "url": "https://www.bbc.com/news/world-us-canada-52241221", "text_len": 5556, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "ried in a mass grave in New York City, as the death toll from the coronavirus continues to rise.", "found": true}, {"type": "with", "string": "The daily rise in coronavirus deaths announced", "found": true}, {"type": "with", "string": "unemployment claims had topped", "found": true}, {"type": "without", "string": "Can we answer your question on the coronavirus?", "found": false}, {"type": "without", "string": "Four out of five jobs affected by virus globally", "found": false}, {"type": "without", "string": "Top Stories", "found": false}]}
{"file": "stardewvalleywiki.com.penny.html", "url": "https://stardewvalleywiki.com/Penny", "text_len": 36096, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Penny lives with her mom, Pam, in a little trailer by", "found": true}, {"type": "with", "string": "Penny is a villager who lives in Pelican Town", "found": true}, {"type": "with", "string": "A fermented beverage made from honey.", "found": false}, {"type": "without", "string": "Content is available under", "found": false}, {"type": "without", "string": "Privacy policy", "found": false}, {"type": "without", "string": "Admin noticeboard", "found": false}]}
{"file": "munich2022.com-topathleten.html", "url": "https://www.munich2022.com/de/europas-topathleten-fit-fur-munchen-2022", "text_len": 1299, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Weltjahresbestleistung von 6,02 m", "found": true}, {"type": "with", "string": "dass ich viel Selbstvertrauen habe,", "found": true}, {"type": "with", "string": "dass ich viel Selbstvertrauen habe,", "found": true}, {"type": "without", "string": "Getty Images", "found": false}, {"type": "without", "string": "Externer Inhalt", "found": false}, {"type": "without", "string": "Tags", "found": false}]}
{"file": "fitforfun.de.sozialeaengste.html", "url": "https://www.fitforfun.de/news/studie-zeigt-zwei-beliebte-lebensmittel-koennen-gegen-soziale-aengste-helfen-531297.html", "text_len": 2830, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Schon l\u00e4nger ist bekannt:", "found": true}, {"type": "with", "string": "Da der Darm und die Psyche eng", "found": true}, {"type": "with", "string": "Fermantation ist die chemische Umwandlung", "found": true}, {"type": "without", "string": "Quellen ausblenden", "found": false}, {"type": "without", "string": "Top-Themen bei FIT FOR FUN", "found": true}, {"type": "without", "string": "Meistgelesen", "found": false}]}
{"file": "Popkultur.de-Schauspieler.html", "url": "https://popkultur.de/homosexuelle-schauspieler/", "text_len": 14562, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "\u00dcber die Jahre hinweg haben homosexuelle Schauspieler", "found": true}, {"type": "with", "string": "ihren unverwechselbaren Stempel auf die Welt des Entertainments gesetzt.", "found": true}, {"type": "with", "string": "Trotz Hindernissen und Vorurteilen", "found": true}, {"type": "without", "string": "Neue Beitr\u00e4ge", "found": false}, {"type": "without", "string": "Die zehn besten & sch\u00f6nsten Smartwatches f\u00fcr Frauen", "found": false}, {"type": "without", "string": "Die 25 erfolgreichsten schwedischen S\u00e4nger & S\u00e4ngerinnen", "found": false}]}
{"file": "freiheit.org-\u00fcberlebende.html", "url": "https://www.freiheit.org/de/holocaust-ueberlebende-margot-friedlaender-wird-100-jahre", "text_len": 1470, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Gespr\u00e4ch mit Sabine", "found": true}, {"type": "with", "string": "Herzlichen Gl\u00fcckwunsch.", "found": true}, {"type": "with", "string": "Als eine der letzten", "found": true}, {"type": "without", "string": "Meist gelesen", "found": false}, {"type": "without", "string": "\u201eDie Eskalation geht", "found": false}, {"type": "without", "string": "Die Sorge unter der j\u00fcdischen", "found": false}]}
{"file": "gofeminin.de.horoskop.html", "url": "https://www.gofeminin.de/horoskop/liebeshoroskop-januar-2023-s4055611.html", "text_len": 6064, "tp": 2, "fn": 1, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Zeit f\u00fcr gro\u00dfe Gef\u00fchle?", "found": false}, {"type": "with", "string": "Im Januar sind Sie vertr\u00e4umt", "found": true}, {"type": "with", "string": "Doch nicht nur im Bett klappt es", "found": true}, {"type": "without", "string": "Folge uns \u00fcberall!", "found": false}, {"type": "without", "string": "wir haben viele spannende Themen", "found": false}, {"type": "without", "string": "Auch lesen:", "found": true}]}
{"file": "backen.de.maulwurfkuchen.html", "url": "https://backen.de/rezept/maulwurfkuchen-mit-erdbeeren", "text_len": 715, "tp": 2, "fn": 3, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "f\u00fcr 12 St\u00fcck", "found": false}, {"type": "with", "string": "z.B. Dr. Oetker Gelatine fix (15 g)", "found": false}, {"type": "with", "string": "F\u00fcr dieses Rezept ben\u00f6tigst", "found": true}, {"type": "with", "string": "Teigschaber", "found": true}, {"type": "with", "string": "und schneide sie in kleine W\u00fcrfel.", "found": false}, {"type": "without", "string": "Bild anzeigen", "found": false}, {"type": "without", "string": "Schreib du doch einen", "found": false}, {"type": "without", "string": "Neugierig geworden?", "found": false}]}
{"file": "libero.pe-ronaldo.html", "url": "https://libero.pe/futbol-internacional/2022/05/06/manchester-united-vs-brighton-en-vivo-via-star-plus-fox-sports-sky-sports-espn-2-premier-league-2022-cristiano-ronaldo-56304", "text_len": 3973, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "cinco del Arsenal. Eso s\u00ed, la desventaja", "found": true}, {"type": "with", "string": "As\u00ed fue el gol de Mois\u00e9s Caicedo que", "found": true}, {"type": "with", "string": "siendo una tarea muy dif\u00edcil, los dirigidos", "found": true}, {"type": "without", "string": "Barcelona: el d\u00eda que Ter Stegen", "found": false}, {"type": "without", "string": "Brighton gole\u00f3 al Manchester United por", "found": false}, {"type": "without", "string": "Manchester United vs. Brighton, en vivo: minuto", "found": true}]}
{"file": "docs.docker.com.install.html", "url": "https://docs.docker.com/engine/install/", "text_len": 5541, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Docker Desktop for Windows", "found": true}, {"type": "with", "string": "0.0.0-YYYYmmddHHMMSS-abcdefabcdef", "found": true}, {"type": "with", "string": "Please DO NOT file a public issue", "found": true}, {"type": "without", "string": "Installation per distro", "found": false}, {"type": "without", "string": "On this page:", "found": false}, {"type": "without", "string": "Toggle navigation", "found": false}]}
{"file": "futurezone.at.lyft.html", "url": "https://futurezone.at/digital-life/uber-konkurrent-lyft-startet-mit-waymo-robotertaxis-in-usa/400487461", "text_len": 2053, "tp": 2, "fn": 0, "fp": 0, "tn": 2, "details": [{"type": "with", "string": "Einige Kunden des Fahrdienst-Vermittler Lyft", "found": true}, {"type": "with", "string": "zeitweise rund vier Prozent.", "found": true}, {"type": "without", "string": "Allgemeine Nutzungsbedingungen", "found": false}, {"type": "without", "string": "Waymo bittet Autohersteller um Geld", "found": false}]}
{"file": "sueddeutsche.de.flixtrain.html", "url": "https://www.sueddeutsche.de/wirtschaft/bahn-flixbus-flixtrain-deutschlandtakt-fernverkehr-1.4445845", "text_len": 3904, "tp": 2, "fn": 0, "fp": 0, "tn": 4, "details": [{"type": "with", "string": "Bahn-Konkurrenten wie Flixbus f\u00fcrchten durch den geplanten Deutschlandtakt", "found": true}, {"type": "with", "string": "auch der Bus ein klimafreundliches Verkehrsmittel sei", "found": true}, {"type": "without", "string": "05:28 Uhr", "found": false}, {"type": "without", "string": "ICE im S-Bahn-Takt", "found": false}, {"type": "without", "string": "Diskussion zu diesem Artikel auf", "found": false}, {"type": "without", "string": "Berater-Aff\u00e4re bringt Bahnchef Lutz in Bedr\u00e4ngnis", "found": false}]}
{"file": "timesofisrael.com.washington.html", "url": "https://www.timesofisrael.com/state-of-washington-swears-in-first-native-american-jewish-supreme-court-justice/", "text_len": 4417, "tp": 3, "fn": 0, "fp": 1, "tn": 2, "details": [{"type": "with", "string": "Governor Jay Inslee appointed Montoya-Lewis", "found": true}, {"type": "with", "string": "I was raised to remember that I come", "found": true}, {"type": "with", "string": "At the ceremony, there was an invocation from", "found": true}, {"type": "without", "string": "Get The Times of Israel", "found": true}, {"type": "without", "string": "For as little as $6 a month", "found": false}, {"type": "without", "string": "Already a member? Sign in to stop seeing this", "found": false}]}
{"file": "interscenar.io.hoeren.html", "url": "http://www.interscenar.io/politik/eindruecke/was-wir-ueber-uns-nicht-hoeren-wollen", "text_len": 7968, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Viele ahnen es eigentlich schon, aber keiner", "found": true}, {"type": "with", "string": "So wie wir heute mit zwischenmenschlichen", "found": true}, {"type": "with", "string": "Und jetzt lassen Sie doch mal", "found": true}, {"type": "without", "string": "Den Artikel mit anderen teilen/diskutieren:", "found": false}, {"type": "without", "string": "hier bin ich eigentlich nur zuf\u00e4llig", "found": false}, {"type": "without", "string": "Theater- und Filmschauspielerin aus 2 Welten", "found": false}]}
{"file": "energiezukunft.eu.bioenergie.html", "url": "https://www.energiezukunft.eu/erneuerbare-energien/biomasse/bundesregierung-drosselt-bioenergie-branche-protestiert/", "text_len": 8111, "tp": 2, "fn": 1, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "Am vergangenen Freitag", "found": true}, {"type": "with", "string": "Die Absch\u00f6pfung von Erl\u00f6sen", "found": true}, {"type": "with", "string": " Die Bioenergieverb\u00e4nde im Hauptstadtb\u00fcro", "found": false}, {"type": "without", "string": "Mehr zum Thema", "found": false}, {"type": "without", "string": "TOP-THEMEN", "found": false}, {"type": "without", "string": "Magazine", "found": false}]}
{"file": "brasil247.com-militares.html", "url": "https://www.brasil247.com/regionais/brasilia/militares-enviaram-88-questoes-ao-tse-sobre-eleicoes-e-urnas-eletronicas", "text_len": 2344, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "supostos riscos e fragilidades", "found": true}, {"type": "with", "string": "vota\u00e7\u00e3o ainda era em c\u00e9dula de papel", "found": true}, {"type": "with", "string": "levantadas apesar de os \u00f3rg\u00e3os", "found": true}, {"type": "without", "string": "MAIS POPULAR", "found": false}, {"type": "without", "string": "(Foto: ABr)", "found": false}, {"type": "without", "string": "Fique por dentro do 247", "found": false}]}
{"file": "twincities.com-mayor.html", "url": "https://www.twincities.com/2023/11/08/st-louis-park-elects-a-new-mayor-apparently-the-first-somali-american-to-lead-a-u-s-city/", "text_len": 955, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": " What I had learned the first time is that this is just a milestone.", "found": true}, {"type": "with", "string": "It is not the destination", "found": true}, {"type": "with", "string": "Mohamed told the Sahan Journal.", "found": true}, {"type": "without", "string": "MOST POPULAR", "found": false}, {"type": "without", "string": "RELATED ARTICLES", "found": false}, {"type": "without", "string": "TRENDING NATIONALLY", "found": false}]}
{"file": "gormulus.wordpress.com.durfen.html", "url": "https://gormulus.wordpress.com/2012/12/11/das-wird-man-ja-wohl-noch-sagen-durfen/", "text_len": 5107, "tp": 3, "fn": 0, "fp": 0, "tn": 3, "details": [{"type": "with", "string": "leicht beratungsresistent erscheint.", "found": true}, {"type": "with", "string": "Ein regelrechter Hammer ist dann die Gleichsetzung von Gaza mit einem KZ.", "found": true}, {"type": "with", "string": "sobald ihre abstruse Gedankenwelt etwas n\u00e4her beleuchtet wird", "found": true}, {"type": "without", "string": "Mielke 2.0", "found": false}, {"type": "without", "string": "icken des JMStV gewidmet.", "found": false}, {"type": "without", "string": "Updates!", "found": false}]}
{"file": "btv.de-spuren.html", "url": "https://www.btv.de/de/spielbetrieb/news/auf-den-spuren-von-rafael-nadal.html", "text_len": 2415, "tp": 3, "fn": 0, "fp": 2, "tn": 1, "details": [{"type": "with", "string": "Februar 2022 in der TennisBase Oberhaching", "found": true}, {"type": "with", "string": "und diesmal sogar in der dritth\u00f6chsten", "found": true}, {"type": "with", "string": "findet am kommenden Wochenende", "found": true}, {"type": "without", "string": "Weitere Infos unter www.itfjuniors.de.", "found": true}, {"type": "without", "string": "Liam Gavrielides", "found": true}, {"type": "without", "string": "PARTNER", "found": false}]}