import spacy from collections import Counter import re as regex import os from saxonche import PySaxonProcessor #### Loads all of the necessary variables and functions. #nlp = spacy.cli.download("en_core_web_lg") nlp = spacy.load("en_core_web_lg") ######################################################################################### # ebb: After reading the NLP output, we know spaCy is making some mistakes. # So, here let's try adding an EntityRuler to customize spaCy's classification. We need # to configure this BEFORE we send the tokens off to nlp() for processing. ########################################################################################## # Create the EntityRuler and set it so the ner comes after, so OUR rules take precedence # Sources: # W. J. B. Mattingly: https://ner.pythonhumanities.com/02_01_spaCy_Entity_Ruler.html # spaCy documentation on NER Entity Ruler: https://spacy.io/usage/rule-based-matching#entityruler config = {"spans_key": None, "annotate_ents": True, "overwrite": True, "validate": True} ruler = nlp.add_pipe("span_ruler", before="ner", config=config) # 2023-04-07: ebb: NOTE: before="ner" setting seems to allow the spaCy NER rules to prevail over these patterns where # there is a conflict. # after="ner" means that the spaCy NER is TOTALLY OVERWRITTEN and invalidated by our patterns. # Notes: Mattingly has this: ruler = nlp.add_pipe("entity_ruler", after="ner", config={"validate": True}) # But this only works when spaCy doesn't recognize a word / phrase as a named entity of any kind. # If it recognizes a named entity but tags it wrong, we correct it with the span_ruler, not the entity_ruler patterns = [ {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "^-\w+?"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "^.$"}}]}, # ebb: Don't match on any single characters! {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "\^+"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "^\w\w$"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "^[a-z]+\s+[a-z]+$"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "^.*?__{2,}.*?$"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "CHRISTIAN(ITY|DOM)?"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "CHRISTIAN\s+NETWORK"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Catholic(ism)?"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "[A-Z]{2,}[A-Z][a-z]+"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "[a-z]{2,}[A-Z][a-z]+"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "^.*?[a-z][A-Z].*?$"}}]}, # ebb: Above line attempts to stop matching things like Oak IslandThe Method {"label": "NULL", "pattern": [{"TEXT" : {"REGEX": "^[Mm\-]+$"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "\w+cia\w+"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "fed\w+"}}]}, # SOCIALISMBY RICHARD # ebb: Above line attempts to stop matching things Mmm-mm or mm , etc. {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "TITIOUS CONCEPTS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "TORTIOUS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "THROUGHWAYS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "TARGET"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "NULL"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Sympathisers"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Sympathy"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "UNTIL"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "UNCLE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "VCI"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "VISUALIZATION"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "YOGA"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "ack Canfield"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "aurem concepisti"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Xref"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Wspomnienia"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Untrustworthy"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Twelve Apostles"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Tsar"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Treasurer"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Thunderer"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Thou raisest"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Thou cleansest"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Thou castest"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "This Leopold the Traitor"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Swore"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Swastika"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Superstrings"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Subj"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Subterrene"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Sts"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Strength"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Sol Deus Invictus"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Skis"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Sect"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Sen"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Senza Aristotele noi"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Salubrious Living"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Saint vouches"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Safehaven"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "SURPRISED"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "SURE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "SUCCESSIVE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "SUBSEQUENT"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "STUNTS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "STREAMLINED"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "SPECULATION"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "SPECULA"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "SOVEREIGN"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "SHOCKED"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "SEPT"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "SAVIOR"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Roman Emperor"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Revelation"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Resurrection Bone"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Relearning"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Reason"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Read again Knocking the Key Weapon"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Rea"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "RESOLVE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "RESALE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "REBELS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "RATIFICATION"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Qui"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Priest"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Price"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Popes"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Place"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Philosophizing"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Pharmacopaeia"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Pharaoh"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Pauline Privilege"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Paul the Persecutor"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Page"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Pagan Fathers"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "PWs"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "PROPAGANDA"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "PRIVILEGES"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "PRIOR RESTRAINT"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "PRINCE satropic"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "PRESERVATION"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "POPE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Obersturmbannfuehrer"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Obersturmbannfuehrer Brandt"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Obersturmbannfuehrer Eichmann"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Obersturmbannfuehrer Liebehenschel"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Obersturmbannfuehrer Rauff"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Obersturmbannfuehrer Rodl"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Obersturmbannfuehrer Sievers"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Obersturmbannfuehrer Walter Rauff"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "OPIUM CULTIVATION"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Nutshell"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Numberless"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Num"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Northwest"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Northshore"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Northeast"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Ngo Dinh Diem"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Ngo Din Diem"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Nay"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "NAZI CARTEL"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "NATURE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Msgr"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Mother Goose"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Ministerially"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Martial Law Threat"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Marquis Who"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Mapmakers"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Mao"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "MIllbourn"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "MEDLEY"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "MAR"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Lop"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "LYINGLY FOUNDED"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Law"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "LAW"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Keys"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "KOD"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Juifs"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Judo"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Joseph the Carpenter"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Jerome arraigns"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Jack Built"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "JUDAICA"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "JURIS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "JOINT"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "JHVH"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "JESUS THE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "JESUS DIED"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Izvestiya VUZ"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Iron Shins"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Iren"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Infotechnology"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Inerrancy"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Imprimatur"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Imposture"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Implore"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Immortale Dei"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Illuminatus Lanz"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Illiterates Illiterates"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "INTELLECTUALS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "IMMOVABLE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "IMMIGRANT AZIZ Rehman"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "ILLUNINATI USE MAFIAS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Hun"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Hoo boy"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Holy Virginity"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Holy Vehm"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Hoc Signo"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "His Covenant"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Henry the Navigator"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Heathens don"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "auptsturmfuehrer Truehe"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Hauptscharfuehrer Ruebe"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Hamstring Yugo"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "HYPERSPACE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "HUMANE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "HEED"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "HEARINGS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Guillotine"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Grupenfuehrer Globocnik"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Gruppenfuehrer Katzmann"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Groom"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Gregory the Great"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Grammarians"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Grammar"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Gospel"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Gort"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Goebbelesque"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Godhead"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Girkalinei Comm"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Geschichte der Staatstheorien"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Genus Shamanensis"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Genius"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Gene Pool"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Gemeter"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Gaude Virgo"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Gamel Abdul Nasser"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Gameplayers"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Galicie Ukrainienne"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Gal"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "GUNJAMMER"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "GUILTY"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "GREED"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "GRAMS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "GOVERNORS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "GENIUS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "GAER"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Furness"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Free Inq"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Foxx"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Foo Fighters"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Fig"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Figs"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Feverfew"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Feathers"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Fathers"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "FUNC"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "FOUO"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "FILES KIT"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "FEVERFEW"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "FHK"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Exodus"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Eur"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Epistle clxvi"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Epistle"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Enfranchised"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Endothermic"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Encyc"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Encloged"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Emperor"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Emperor Vespasian"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Electromagnetically"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Ecclesiastici Publici"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Eccles"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Ebrietatis Enconium"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "EXTRAORDINAIRE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "EXPATRIATION"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "EPISTLES"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "ENORMOUS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "EMPLOY"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Dupes"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Dueling Spymasters"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Dual Amiga"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Driver"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Dritte Reich"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Drang nach Osten"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Dorman"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Don sez"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Divinatione Daemonorum"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Distinguished paedagogists"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Dies irae"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Die Geschichte von Joel Brand"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Dew"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Deut"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Desert Rat"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Deregulatory Creep"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Der Weg des Politischen Katholizismus"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Depository"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Debasement"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Death Ray"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Das Sogenannte Boese"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "CORRUPT"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "COMMISSIONED THE UNDERSIGNED"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "CLEARFIELD"}}]}, {"label": "WORK_OF_ART", "pattern": [{"TEXT": {"REGEX": "Pagan Sibylline Oracles"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "CIRCUMSTANTIAL"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "CDT"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "CANNOT"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "BATF"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "BEEN"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "BLACKMAIL"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "BOURGEOIS GENTILHOMME"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Bagdad"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "Balfour Declaration"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Battle"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Biblical"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Bishop"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Blade Runner"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Blackmail"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Blessing"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Briefly"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Brigadefuehrer"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Brigadefuehrer Globocnik"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Brigadefuehrer Gluecks"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Brigadefuehrer Zenner"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Brigadefuhrer Richard Glucks"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Brigadefuehrer"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Brigadefuhrer"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "CREATORS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Cap"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Capitula Angilrammi"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Case"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Charles Mentesana Filmed"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Chillingworth"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Christian Pope"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Chronicles xxviii"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Coddled Omar Abdel Rahman"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Chronicles xxxiv"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Clem"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Commrce"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Corinthians"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Cosi"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Crucifixion"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Czar"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "DECRETALS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "DECAY"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "DEPLETION"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "DISASTROUS THAN PEARL"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "DISEASES"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "DOPE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Damit Ich"}}]}, {"label": "WORK_OF_ART", "pattern": [{"TEXT": {"REGEX": "Pagan Oracles"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Deceits"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Deep Cover"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Demagnetize"}}]}, {"label": "WORK_OF_ART", "pattern": [{"TEXT": {"REGEX": "Mona Lisa"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Demigod"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Demjanjuk"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Democratic Centralism"}}]}, {"label": "WORK_OF_ART", "pattern": [{"TEXT": {"REGEX": "Mein Kampf"}}]}, {"label": "WORK_OF_ART", "pattern": [{"TEXT": {"REGEX": "Mary Magdalin Gospel"}}]}, {"label": "WORK_OF_ART", "pattern": [{"TEXT": {"REGEX": "Horst Wessel Song"}}]}, {"label": "WORK_OF_ART", "pattern": [{"TEXT": {"REGEX": "Fama Fraternitatis"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Physiocrats"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Pagan"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Meo"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "PAGAN"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Obersturmfuehrer"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "MARTYRS"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Jurisconsults"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Jewess"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Jeremiads"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Jehovah's Witnesses"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Jehovah's Witness"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Jehovahs Witness"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "JURORS"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Heathens"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Gypsy"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Geronimo Chiricahua Apache"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Gauleiter"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Frankists"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Framers"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Framer"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Felloweraft"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Evangelist"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Egotists"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Duce"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Babylon(ia)?"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Diluvian Patriarchs"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Christiani\s*ty"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "CAIB"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "the .+?"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Infidels"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Christiani"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "MAHAT"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Mahat"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Atta Boy"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Assailants"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Assassinated Robert"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Article"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Adrift"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "MAD"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "bacchanalian"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "behests"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Parallel"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": ""}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "the\s+?user"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "NETWORK"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Attemps"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Foundation"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Iena"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "attemps"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "pgh"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Christiani"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "MAHAT"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Mahat"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "MAD"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Parallel"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "the\s+?user"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "NETWORK"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Attemps"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Iena"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "attemps"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Advanced"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Believability"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Onesuch"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "the\s+?People"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "REPRINT"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "The\s+?Next\s+?Banking\s+?Crisis"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Incidently"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Martini\s+?Glass"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Customs"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "the\s+?Sheriff"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Greets"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "bey"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "conven"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Pro"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "THUS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "TUNED CIRCUT"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "the\s+?supreme\s+?end"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Ebe"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Big\s+?Government"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "State"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "pseudoscientists"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "undam"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "News"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Times"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "PERIODICALS"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "SPEECHES"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "INCLUSION"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "MAJESTY"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "interpet"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "manifesta"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "aspetic"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "mish"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "petros"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "shevirat"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "sanguinis"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "resop"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "tryed"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "quandry"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "imbeds"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "germain"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "orleans"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "tgg"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Families"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "preparingits"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "germain"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "wintry"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "trogan"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Interested"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Time"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "ACTUALLY"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "ACCIDENTALLY"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "The\s+?Transmission"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "contra"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Mental\s+?Health"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "Bill\s+?of\s+?Rights"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "MCCARREN\s+?ACT"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "Emergency\s+?Detention\s+?Act"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "Geneva\s+?Convention"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "Official\s+?Secrets\s+?Act"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "Executive\s+?Order"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "American\s+?Press\s+?freedom"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "State\s+?Constitution"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "Constitution"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "Martial\s+?Law"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "Martial\s+?Rule"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "Unalienable Rights"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "Alaska\s+?Mental\s+?Health\s+?Bill"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "Multilateral\s+?Protection\s+?of\s+?War\s+?Victims/Prisoners\s+?of\s+?War"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "Multilateral\s+?Protection\s+?of\s+?War\s+?Victims/Civilian\s+?Persons"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "Public\s+?Health\s+?Service\s+?Draft\s+?Act"}}]}, {"label": "LAW", "pattern": [{"TEXT": {"REGEX": "Uniform\s+?Mental\s+?Health\s+?Act"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Executive\s+?Order\s+?#[0-9]+"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Median"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Next"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Daily"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "the\s+?General"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Diplomatic"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "televi"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "patsy"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "mike"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "MODIFY"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Nations"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "substanti"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "audi"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Justice"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Cancer"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Natural\s+?causes"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "PLATO"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "darksuckers"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Darksuckers"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "MAJESTY"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "SNOWBIRD"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "GARNET"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "AGL"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "DELTA"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "the King"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "EXCALIBUR"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "the\s+?secret\s+?control\s+?group"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "JASON"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Heart"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "sentatives"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Peter\s+?Gregory\s+?Original"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Billy\s+?Lovelady\s+?Depository"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "The\s+?World"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "John\s+?Holbrook\s+?Psychiatrist"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Paul\s+?Mandal\s+?Life"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Jackson\s+?Life\s+?Magazine"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Drug"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "thou mayest"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "thou eatest"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Unity\s+?movement"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Conn"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "intel"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "xxx xxxxx"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Xxxxxx Xxxxxxxx"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Xxxxxxx Xxxxxxx"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Wie hoch"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "WOULDN"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Waar"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "WCH"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "WCR"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "yeldeth ben"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "zwite\s+?Aufseher"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "wuz"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "beeb"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "duetschen Juden"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "bison"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "enim pejor"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "enshroud"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "entorce"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "epidemica"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "blasphemously"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "bull dudu"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "bowie asst"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "canonizes"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "clarinews"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "columno"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "complicitly"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "conspiracy buff"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "creo"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "decrepid"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Motor\s+?Collision"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "pro\s+?tem"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Electrotherapeutic"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "megs"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "JRD"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "The Wealth"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "state"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Trade"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Atomic"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Expo"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "looney"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "the\s+?Kingdom"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)??Office\s+?of\s+?Strategic\s+?Services"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Life\s+?Magazine"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Seattle\s+?Post\s+?Intellegencer"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "Industrias\s+?Cardoen"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "di"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "VENTURE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "ALLEGED\s+?REAGAN"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Constitu"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "econonic\s+?aid"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Edgar\s+?Hoover"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "fed"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Apollo\s+?Astronauts"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "the\s+?Temple"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "CONNECTED\s+?WACKENHUT\s+?CORP"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "GREAT"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Lung"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "the\s+?Bill"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Said"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "CAPACITOR"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "SPARK"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "DAMPED"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "ANEW"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "THEREBY\s+?REDUCING\s+?EFFICIENCY"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "HOWEVER"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "TAPPED"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "ELECTRICALLY"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "ELECTRODE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "TUNED\s+?CIRCUT"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "WAVELENGTH"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "HORIZONTALLY"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "THE\s+?OUDIN\s+?PRIMARY"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "AUTOTRANSFORMER"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "the Allied"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "the\s+?National"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Cheez\s+?Whiz"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "the\s+?Rich\s+?Discover\s+?Worthy"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Examiner"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "msen"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "ORG"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Physics\s+?A\.\s+?Mathematical"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "PALE"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Operation"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Order"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Command"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "jackboots"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "DARK"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "COLD"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Long\s+?Range"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "\S+@\S+\.\S+"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Human\s+?Behavior"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "SINCE\s+?LAWYERS\s+?OCCUPY"}}]}, {"label": "WORK_OF_ART", "pattern": [{"TEXT": {"REGEX": "Digha\s+?Nikaya"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "(Ludwig\s+?[Vv]an\s+?)?Beethoven"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Falangist"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Future\s+?of\s+?Freedom\s+?Foundation"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Congressional\s+?committee"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?The\s+?Federal\s+?Bureau\s+?of\s+?Prisons"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?American\s+?Red\s+?Cross"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Annals\s+?of\s+?Internal\s+?Medicine"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Houston\s+?Post"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "MKULTRA"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "KTOK"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Houston\s+?Chronicle"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Concentration\s+?Camp\s+?Program"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Operation\s+?Garden\s+?Plot"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?federal\s+?government"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?British\s+?intelligence"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?JASON\s+?SOCIETY"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Composite\s+?Service\s+?Organization"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Psychological\s+?Operations\s+?Organization"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Council\s+?on\s+?Foreign\s+?Relations"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Dept\.\s+?of\s+?Defense"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Mental\s+?Health\s+?Institution"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Dept\.\s+?of\s+?Transportation"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Dept\.\s+?of\s+?Justice"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?L\.E\.A\.F\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "Junio\s+?Valerio\s+?Black\s+?Prince\s+?Borghese"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Las\s+?Vegas\s+?Bullet"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?C\.I\.A\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?J\.C\.\s+?Penney"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?[Aa]-albionic\s+?Research"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Law\s+?Enforcement\s+?Assistance\s+?Force"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Young\s+?Americans\s+?for\s+?Freedom"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Military\s+?Police\s+?Unit"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Annals"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Inslaw"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "WACL"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "JDL"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "SJG"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "LEAA"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "Newe Anthropologie"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "NSTAC"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "NEWSBYTES"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "NDPC"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "National\s+?Democratic\s+?Policy\s+?Committee"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "National\s+?Security\s+?Telecommunications\s+?Advisory\s+?Committee"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "Tom Davis Research"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Civil\s+?Affairs\s+?Operations"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Civil\s+?Affairs\s+?Organization"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Big\s+?Brother"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Big\s+?brother"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?State\s+?Youthful\s+?Offenders\s+?Division"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?The\s+?California\s+?State\s+?Bar's\s+?Standing\s+?Committee\s+?on\s+?Professional\s+?Responsibility\s+?and\s+?Conduct"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?ILLUMINATI"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Crystic\s+?Institute"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Crystic\s+?institute"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?New\s+?World\s+?Order"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Roundtables"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Club\s+?of\s+?Rome"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Tri-lateral\s+?Commission"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Committee\s+?of\s+?300"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Alaska\s+?Bar\s+?Association"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Rose\s+?Law\s+?Firm"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?University\s+?of\s+?Wisconsin"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?University\s+?of\s+?Southern\s+?California"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?ROTC"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Plunge"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "Fifth\s+?International\s+?Martin\s+?Luther\s+?King\s+?Tribunal"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Bayshore\s+?Inn"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Los\s+?Angeles\s+?Sheriff's\s+?Dept\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?U\.N\.\s+?Security\s+?Council"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?U\.N\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Daily\s+?Telegraph"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Alternative\s+?3"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Library\s+?of\s+?Congress"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?International\s+?Congress\s+?on\s+?Mental\s+?health"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?National\s+?Academy\s+?of\s+?Sciences"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?U\.\s+?S\s+?.\s+?Secret\s+?Service"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Office\s+?of\s+?Thrift\s+?Supervision"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Comptroller\s+?of\s+?the\s+?Currency"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Urban\s+?Plunge"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Institute\s+?of\s+?Atmospheric\s+?Physics"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?State\s+?Department"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?National\s+?Libertarian\s+?Party"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Libertarian\s+?Party"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Bank\s+?of\s+?England"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Dept\.\s+?of\s+?State"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?United\s+?Grand\s+?Lodge"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Board\s+?of\s+?General\s+?Purposes"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?National\s+?Recon\s+?Organization"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?G\.S\.A\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?United\s+?States\s+?Military\s+?Establishment"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?State\s+?Dept\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Sapata\s+?Oil"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?California\s+?National\s+?Guard"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?H\.U\.D\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Royal\s+?Bank\s+?of\s+?Canada"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Bank\s+?of\s+?Montreal"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Rockefeller\s+?Bank"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?American\s+?Express"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Loeb\s+?Company"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?H\.E\.W\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?U\.S\.\s+?Senate"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Institute\s+?of\s+?Political\s+?Studies"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?law\s+?enforcement"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Housing\s+?&\s+?Urban\s+?Development"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Dept\.\s+?of\s+?Education"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Dropa"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Fria Ord"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Haitian"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Astronauts"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "ISHVARA"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Wehrwirtschaftsfuehrer"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Viet\s+?Cong"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Egyptian"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Lybian"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Cuban"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Japanese"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Nicaraguan"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "African"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Indian"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Icelandic"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Russian"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "CANADIAN"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Clandestinism"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "SCIENTOLOGISTS"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Trilateralists"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Homo\s+?Sapiens"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Spaniard"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Freemason"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Freemson"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Freemasonry"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Masonic"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Vietnam\s+?Moratorium"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Homestead\s+?Air\s+?Force\s+?Base"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Moon"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Swartz\s+?Creek"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Marshall\s+?Fields"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Gulf\s+?of\s+?Mexico"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "DREAMLAND"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Pharselis"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Northlake"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Oak Cliff"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Paddington\s+?station"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "David\s+?Munson\s+?Air\s+?Base"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Southeast\s+?Asia"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Eielson\s+?Air\s+?Force\s+?Base"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "U\.S\.\s+?Army\s+?Reserves"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Bay\s+?of\s+?Pigs"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "US\s+?Air\s+?Force\s+?L\.\s+?Fletcher\s+?Prouty"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Bohemian\s+?Grove"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Broadway"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Mockingbird Lane"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Mockingbird"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "LAOS"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Hyannisport"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Lop Nor"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Gross Wannsee"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Groom Lake"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "North\s+?[A-Z][a-z]+"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Monk"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Northern"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Allanwood"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Roswell"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Westminster"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Portland"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Richmond"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Sacramento"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "St\s+?Louis"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "New\s+?Haven"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Milwaukee"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Little\s+?Rock"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Los\s+?Angeles"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Briton"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "El\s+?Paso"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Columbia"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "FORT\s+?HUNT"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Butte"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "State\s*College"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Williamsport"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Landsdale"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Newtown\s*Square"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Allentown"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "New\s*Castle"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Beckley"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Alton"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Stubenville"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Buffalo"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Belleville"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Bloomington"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Carbondale"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Champaign"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Constitantinoble"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Rock\s+?Island"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Birmingham"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "IRAQ"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "CANADA"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "ENGLAND"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Danvers"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "GERMANY"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Montreal"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Canada"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Baltimore"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Anchorage"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Albuquerque"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Albany"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "CORAL\s+?GABLES"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Washington,?\s*D\.?C\.?"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Avon\s+?Park"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Mill\s+?Point"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "El\s+?Reno"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Zagreb"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "ZAGREB"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Whiskey\s*Flat"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "site\s+?S-4"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "LUNA"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "AREA\s+?51"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "El\s+?Salvador\s+?air\s+?base"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Greenville\s+?County"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Toyland"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Sunday"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Sun"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "North\s+?Pole"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Qua\s+?Vieaf"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "North\s+?Viet\s*[Nn]am"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Owl's\s+?Nest"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Dachau"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Hill\s+?Billies"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Cave\s+?Man's"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Cherry\s+?Brook\s+?Valley"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Postbridge"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "McDill\s+?Air\s+?Force\s+?Base"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Egland\s+?Air\s+?Force\s+?Base"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Nazareth"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Latin\s+?America"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "GREAT\s+?BRITAIN"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "U\.S\.S\.R"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "New\s+?York\s+?City"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Soviet\s+?Union"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Viet\s+?Nam"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "U\.S\.A\."}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "U\.S\."}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "U\.S"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Saudi\s+?Arabia"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Washington,\s+?DC"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "the\s+?Vatican"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?British\s+?Empire"}}]}, {"label": "GPE", "pattern": [{"TEXT": {"REGEX": "Pennsylvania"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Warren\s+?Commission"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Tesla\s+?Electric\s+?Company"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Hahn\s+?group"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?U\.S\.\s+?Department\s+?of\s+?Health\s+?and\s+?Human\s+?Services"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?American\s+?Council\s+?of\s+?Life\s+?Insurance"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Health\s+?Insurance\s+?Association\s+?of\s+?America\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?U\.S\.\s+?District\s+?Court"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?United\s+?States\s+?Pacific\s+?Fleet"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Pacific\s+?Fleet"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?National\s+?Guard"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Christic\s+?Institute"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Nugan-Hand"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Military-Industrial\s+?complex"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Condon\s+?Committee"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "COMMUNICATIONS\s+?CANADA"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?ABC"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?CBS"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Unity\s+?movement"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Covert\s+?Action"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?General\s+?Electric"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?US\s+?Army"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?US\s+?Navy"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?London\s+?Underground"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?US\s+?Justice\s+?Department"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Sur\s+?Coester"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Colorado\s+?Springs\s+?Gazette"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?SoftQuad\s+?Inc\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?United\s+?Nations\s+?World\s+?Health\s+?Organization"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?World\s+?Health\s+?Organization"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?L\.E\.A\.A\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Justice\s+?Dept\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "(THE\s+?)?HOUSE\s+?JUDICIARY\s+?COMMITTEE"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Contemporary\s+?Research,\s+?Inc\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?British\s+?Government"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?House\s+?Select\s+?Committee\s+?on\s+?Assassinations"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Office\s+?of\s+?Criminal\s+?Justice\s+?Planning"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Dept\.\s+?of\s+?Defense\s+?of\s+?the\s+?United\s+?States"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Dept\.\s+?of\s+?Commerce"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?MAJIC"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "Mother\s+?Jones"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?W\.A\.\s+?Harriman\s+?&\s+?Co\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Securities\s+?C\.\s+?Commission"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Rockefeller\s+?Syndicate"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Dallas\s+?Citizens\s+?Council"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Round\s+?Table\s+?groups"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Devon\s+?Unidentified\s+?Flying\s+?Objects\s+?centre"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?San\s+?Francisco\s+?Sidewalk\s+?Astronomers\s+?Association"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Dartmoor\s+?Livestock\s+?Protection\s+?Society"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Animal\s+?Defence\s+?Society"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?U\.S\.\s+?Agriculture\s+?Department"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Perpetual\s+?Hidden\s+?Government"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Office\s+?of\s+?the\s+?Deputy\s+?Chief\s+?of\s+?Staff\s+?of\s+?Personnel"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Harriman\s+?Fifteen\s+?Corp\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Israeli\s+?secret\s+?service"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Bell\s+?Helicopter"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Eurocheque"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?MasterCard"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?CitiCorp"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Marconi\s+?company"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Marconi"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?NRO"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Illinois\s+?Bell\s+?Telephone\s+?Company"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?UFO\s+?Magazine"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?University\s+?of\s+?Toronto"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Taymar,\s+?Inc\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Kerr\s+?McGree\s+?Nuclear\s+?Corporation"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Edward\s+?R\.\s+?Murrow\s+?Center"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?American\s+?Ship\s+?and\s+?Commerce\s+?Corp\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?American\s+?government"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Silverado\s+?Savings\s+?&\s+?Loan"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?American\s+?Association\s+?for\s+?the\s+?Advancement\s+?of\s+?Science"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?G\.H\.\s+?Walker\s+?&\s+?Co\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Office\s+?of\s+?Preparedness"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?National\s+?Aeronautics\s+?and\s+?Space\s+?Agency"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Martin\s+?Marietta\s+?company"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?John\s+?Birch\s+?Society"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?U\.S\.\s+?government"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Cleveland\s+?Field\s+?Office"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "The\s+?John\s+?F\.\s+?Kennedy\s+?Center\s+?for\s+?the\s+?Performing\s+?Arts\s+?Education\s+?Program"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?United\s+?States\s+?government"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?National\s+?Institute\s+?of\s+?Agrarian\s+?Reform"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?National\s+?Institute\s+?of\s+?Mental\s+?Health"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?INRA"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Massachusetts\s+?Institute\s+?of\s+?Technology"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?International\s+?UFO\s+?Bureau"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?National\s+?Investigations\s+?Committee\s+?on\s+?Aerial\s+?Phenomena"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Dept\.\s+?of\s+?the\s+?Army"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?U\.S\.\s+?Air\s+?Force"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?University\s+?of\s+?Arizona"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Criminal\s+?Justice\s+?System"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Sheriffs\s+?Dept\."}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "Standard\s+?&\s+?Poors"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Federal\s+?Reserve"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?L\.E\.A\.A\.\s+?Newsletter"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Texas\s+?School\s+?Book\s+?Depository"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Senate\s+?Select\s+?Committee\s+?on\s+?Intelligence"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Senate\s+?Intelligence\s+?Committee"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?House\s+?Committee\s+?on\s+?Assassinations"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?House\s+?Committee"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?House\s+?Select\s+?Committee"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?House\s+?of\s+?Saud"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "Wackenhut"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "KPFA"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "WACKENHUT\s+?CORP"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?International\s+?Agency\s+?for\s+?Research\s+?on\s+?Cancer"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?The\s+?London\s+?Times"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "WACKENHUT"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Federal\s+?Emergency\s+?Management\s+?Agency"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Special\s+?Forces\s+?Unit"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Defense\s+?Central\s+?Index"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Joint\s+?Chiefs\s+?of\s+?Staff"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Federal\s+?Information\s+?Center"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?American\s+?Counter-intelligence\s+?Corps"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "CIC"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?British\s+?Establishment\."}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "[A-Z][a-z]+\s+([A-Z]\.\s+[A-Z][a-z]+)?(,\s+Jr\.)"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "[A-Z][a-z]+\s+([A-Z]\.\s+[A-Z][a-z]+)?(\s+Jr\.)"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "[A-Z][a-z]+\s+(([A-Z]\.\s+)?[A-Z][a-z]+([A-Z][a-z]+)?)?\s+Jr\."}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "[[A-Z][a-z]+\s+[A-Z]\.\s+([A-Z][a-z])?[A-Z][a-z]+"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Nostradameus"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Harrison\s+?Edward\s+?Livingstone"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "J\.\s+?Herbert\s+?Sawyer"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "L\.\s+?Harmon\s+?Zeigler"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "C\.\s+?Everett\s+?Koop"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Edward\s+?L\.\s+?van\s+?Roden"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Kirschbaum"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Raphael\s+?Shumacker"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Martin\s+?Marietta"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "DAVID\s+?MELLOR"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "J\.\s+?W\.\s+?Willmott"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "O'Neill"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "O'Neil"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "O'Neal"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Orsenigo"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Neil\s+?Bush"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "SWAMI\s+?VIVEKANANDA"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Morris\s+?Ellowitz"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Harry\s+?Thon"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "David\s+?Ferrie"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Darrell\s+?W\.\s+?Garner"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "David\s+?Goldstein"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Mona\s+?B\.\s+?Saenz"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Abraham\s+?Zapruder"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Clayton\s+?Fowler"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "WILLIAM\s+?L\.\s+?LAW"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Reynolds"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Marriner S. Eccles"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "H\.S\.M\.\s+?Coxeter"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "A\.D\.\s+?Bowie"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Phillip\s+?Geraci"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "E\.R\.\s+?Walthers"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "George\s+?McGann"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Perry\s+?Russo"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "JOHN\s+?PHILIP\s+?NICHOLS"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "SALVADOR\s+?ALLENDE"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "D\.\s+?CASOLARO"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "AFFIDAVIT"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Koreshan"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Koresh"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Carl\s+?Oglesby"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Earline\s+?Roberts"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Lee\s+?Bowers,\s+?Jr\."}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Locust"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Starmaster"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Nuri\s+?Al-Said"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Pamela\s+?Courson"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Jimmy\s+?Hendrix"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Faisal\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Milton\s+?Cooper"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Mostafa\s+?A\s+?Abdelkader"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Abdul\s+?Llah"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Marc\s+?J\.\s+?Seifer"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "R\.\s+?J\.\s+?Biggar"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Stanford\s+?White"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John\s+?Paul\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John\s+?Paul\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Ensign\s+?Ball"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "O\.H\.\s+?Cril"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Crill"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "KRLL"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "KRLLL"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "EBE"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Rockefeller\s*III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John\s*?D\.\s*Rockefeller\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Dennis\s+?DeConcini"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Phil\s+?Gramm"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "BILL\s+?HAMILTON"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Gramm"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "DeConcini"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Michael\s+?Emerling"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Rockefeller"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Johnston"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Dodd"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Laurence\s*Rockefeller"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John\s+D\.\s*Rockefeller"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John\s+D\.\s*Rockefeller\s*IV"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John\s+D\.\s*Rockefeller,\s*Jr\."}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "William\s*H\.\s*Draper\s*III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Eduardo"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "EARL\s*W\.\s+?BRIAN"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "RICONOSCIUTO"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Ramakrishna"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Don\s+?Ecker"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John\s+?Galt"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "C\.D\.\s+?Jackson"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "G\.H\.\s+?Walker\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Daniel\s+?Gooch"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Ramses\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Alexander\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Alexander\s+?V"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Alexander\s+?IV"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Alexander\s+?VI"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Breck\s+?Wall"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "CARROLL\s+?QUIGLEY"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Swami\s+?Vivekananda"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "DOOLITTLE"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "James\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Oswald\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Oswald\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Umberto\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Nikola\s+?Tesla"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Tesla"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "C\.\s+?Hamilton\s+?Ellis"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Alfred\s+?Ely\s+?Beach"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Ed\s+?Vyrdolak"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Beach"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Lord\s+?Milner"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Agapetus\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Agapetus\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "C\.\s+?Victor\s+?Raiser\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "C\.V\.\s+?Raiser\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Boniface\s+?VIII"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Boniface\s+?VII"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Boniface\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Boniface\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Boniface\s+?VI"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Gonda"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Ollie\s+?North"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Oliver\s*North"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Mr\.\s*North"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "E\.\s+?Howard\s+?Hunt"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "MLK"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "RFK"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "O\.\s+?W\.\s+?Judd"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "C\.J\.\s+?Duffner"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "J\.P\.\s+?Morgan"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Richard\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "James\s+?McDonald"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "McDonald"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Saunders"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Richard\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "George\s+?Terwilliger\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "C\.E\.\s+?Koop"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Callistus\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Francis\s+?von\s+?Hapsburg"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Malcom\s+?X"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Paramahansa\s+?Yogananda"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Victor\s+?IV"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Carles\s+?C\.\s+?Messick\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John\s+?D\.\s+?Rockefeller\s+?IV"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "MARCONI"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Marconi"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Bill\s+?English"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Bill\s+?Cooper"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Charles\s+?W\.\s+?Bailey\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Charles\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Charles\s+?McKee"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Charles\s+?X"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Charles\s+?V"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Jerome\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Mark\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John\s+?XXIII"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Ferdinand\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Hillary\s+?Rodham\s+?Clinton"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Vincent\s+?Foster,\s+?jr\."}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Nicholas\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Nicholas\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Nicholas\s+?V"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Vespasian"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John\s+?Zajac"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Sylvester\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Sylvester\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Engenius\s+?IV"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Philip\s+?IV"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Stephen\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Stephen\s+?VI"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Pious\s+?X"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Honorius\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Sergius\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Adrian\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Adrian\s+?VI"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "William\s+?F\.\s+?Hamilton\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "James\s+?Baker\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "William\s+?Stamps\s+?Farish\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Elizabeth\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Anacletus\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Edward\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Edward\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Edward\s+?V"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Matthew\s+?XVI"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Vyrdolak"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Thothmes\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Harry\s+?Hurt\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Napoleon\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Clement\s+?VIII"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Clement\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Clement\s+?VI"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Clement\s+?IV"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Pius\s+?X"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Pius\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Pius\s+?IX"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Pius\s+?XI"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Pius\s+?XII"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Leo\s+?IX"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Leo\s+?X"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Leo\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Leo\s+?XIII"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Amenhotep\s+?IV"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Charles\s+?W\.\s+?Bailey\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Constantine"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Tut-ankh-amen"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Sixtus\s+?V"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Sixtus\s+?IV"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Benedict\s+?XIV"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Benedict\s+?VI"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Benedict\s+?IX"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Benedict\s+?XV"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "George\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "George\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Gregory\s+?VII"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Gregory\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Gregory\s+?XVI"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Gregory\s+?IX"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Constantine\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Albert\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Albert\s+?V\.\s+?Bryan\s+?Jr"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Alfonso\s+?XII"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Alfonso\s+?XIII"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Gustavus\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Gustav\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Felix\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Valentinian\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Innocent\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Innocent\s+?IV"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Frederick,\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Frederick\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Theodosius\s+?I"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Henry\s+?VIII"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Henry\s+?VI"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Henry\s+?IV"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Louis\s+?IX"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Louis\s+?XVI"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Joseph\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Catherine\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "James\s+?D\s+?Bryant\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Paul\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Paul\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Julius\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Paul\s+?VI"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "William\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "William\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Baldwin\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Urban\s+?VIII"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Charles\s+?Goodhue,\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Edwin\s+?Meese,\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Thomas\s+?Downing"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Thomas\s+?E\.\s+?Davis"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "J\.A\.\s+?Milteer"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Charles\s+?Cabell"}}]}, {'label': 'PERSON', 'pattern': [{'TEXT': {'REGEX': 'James\s+?"Bo"\s+?Gritz'}}]}, {'label': 'PERSON', 'pattern': [{'TEXT': {'REGEX': 'Mike\s+?"Chucky"\s+?Peters'}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "James\s+?Earl\s+?Ray"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Earl\s+?Wheeler"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "William\s+?S\.\s+?Thompson"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "S\.\s+?Rilling"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Ralph\s+?Paul"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Scott\s+?Weekly"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Ford,\s+?L\.H"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "A\.\s+?Vilenkin"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Renate\s+?Viebahn"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Lustick,\s+?Ian\s+?S\."}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Friedman,\s+?Robert\s+?I\."}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Howard\s+?Sprague"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Mark\s+?Clark"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Owen"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Theodore\s+?Shackley"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "DeLesseps\s+?Morrison"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Betty\s+?McDonald"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Clines"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "L\.\s+?F\.\s+?Prouty"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "L\.\s+?Fletcher\s+?Prouty"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Knight,\s+?Amy\s+?W\."}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Martindale"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "R\.\s+?Knox"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Leon\s+?Oswald"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "H\.\s+?Ross\s+?Perot"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Stanly\s+?R\.\s+?Larsen"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "L\.E\.\s+?Allen\s+?Jr\."}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "A\.\s+?Lewis"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "D\.\s+?Fleming"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "J\.\s+?Edgar\s+?Hoover"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "V\.\s+?Pirie"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Nancy\s+?B\."}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Ronald\s+?Reagan"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "P\.\s+?Gibbs"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "W\.\s+?Citrine"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "E\.\s+?Moore"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Lyndon\s+?Johnson"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John(\s*F\.?)\s*Kennedy"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Zia\s+?ul-Haque"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Ronald\s*Payne"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "R\.\s*Muldoon"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "F\.\s*Orr"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Frank\s+?H\.\s+?Schwable"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "R\.\s+?F\.\s+?Doyle"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "David\s+?Munson"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Frances\s+?Clark"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "G\.\s+?Gordon\s+?Broadbent"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "J\.\s+?Segal"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "F\.\s+?Brangwyn"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Luc\s+?Montagnier"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "A\.\s+?Luchaire"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "L\.\s+?Segal"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "R\.\s+?William\s+?Davis"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "William\s+?C\.\s+?Sullivan"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "William\s+?W\.\s+?Quinn"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "William\s+?R\.\s+?Pabst"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Oliver\s+?Nichelson"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "James\s+?Worrell,\s+?Jr\."}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Hank\s+?Suydam"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "William\s+?Pabst"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "G\.\s+?Maeferren"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Dian-Lanz"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Buria"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "North"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Ortho\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Swami\s+?Nikhilananda"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Santo\s+?Trafficante"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Felix\s+?Rodreguez"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Stanly\s+?F\.\s+?Yoles"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "G\.\s+?B\.\s+?Chisholm"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Baron\s+?Kurt\s+?von\s+?Schroeder"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "George\s+?Bush"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Roland\s+?Harriman"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John\s+?Foster\s+?Dulles"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Sherman\s+?Skolnick"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Francis\s+?G\.\s+?Powers"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Kenneth\s+?O'Donnell"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "J\.M\.\s+?English"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "William\s+?Sullivan"}}]}, {'label': 'PERSON', 'pattern': [{'TEXT': {'REGEX': 'C\.L\. "Lummie" Lewis'}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Garland\s+?Slack"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Billy\s+?Lovelady"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John\s+?Holbrook"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Marguerite\s+?Oswald"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Andrew\s+?Cetti"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Will\s+?H\.\s+?Griffin"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Peter\s+?Gregory"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Harry\s+?Grindell-Matthews"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Grindell-Matthews"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Rosenholtz"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Karen\s+?Silkwood"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "N\.\s+?McQuire"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "William\s+?Highland"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Harriman"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "William\s+?Saxby"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Ellis\s+?O\.\s+?Briggs"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Daniel\s+?Ludwig"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Robert\s+?C\.\s+?Klowers"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Tatum\s+?B\.\s+?Laird"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "William\s+?F\.\s+?Buckley,\s+?Jr\."}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "William\s+?Randolph\s+?Hearst,\s+?Jr\."}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Justin\s+?Dart"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Larry\s+?McDonald"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Mac\s+?MacPherson"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "MacPherson"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Callen"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Lievense"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "CASTRO"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Erik\s+?Jonsson"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Charles\s+?E\.\s+?Allen"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Laurence\s+?H\.\s+?Shoup"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "David\s+?Rieff"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "David\s+?Rockefeller"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Diamond"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Donald\s+?DeFreeze"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "McGovern"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "McCarthy"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John\s+?DiNardo"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Gyeorgos\s+?C\.\s+?Hatonn"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John\s+?Connally"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Lyndon\s+?LaRouche"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "LaRouche"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "W\.H\.\s+?Bowart"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Alan\s+?H\.\s+?Belmont"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Alan\s+?Belmont"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Joseph\s+?C\.\s+?Ayres"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Lehrman"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "John\s+?McCone"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Al\s+?Haig"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "J\.\s+?Latimer\s+?Clark"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "T\.\s+?W\.\s+?Rammell"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Elizabeth\s+?II"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Martha\s+?Honey"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Vince\s+?Bielski"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Anton\s+?Chaitkin"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Dean\s+?Burch"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Burch"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Gaius\s+?Caesar"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Gaius\s+?Chaerea"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "McCone"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Richard\s+?Nixon"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "David\s+?Wise"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Zapruder"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Mortimer\s+?J\.\s+?Adler"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Angela\s+?Davis"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Segals"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "COLIN\s+?WALLACE"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Thomas\s+?B\.\s+?Ross"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "JACOB\s+?G\.\s+?HORNBERGER"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Bowart"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Frank\s+?H\.\s+?Schwable"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Billy\s+?Goodman"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Leonard\s+?Pullin"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "R\.\s+?J\.\s+?Biggar"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "David\s+?R\.\s+?Hunter"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Hugh\s+?Everett,\s+?III"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Sigmund\s+?Diamond"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "J\.\s+?Pierpont\s+?Morgan"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Montagnier"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "W\.\s+?Schmunger"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Mary\s+?Pat\s+?Flaherty"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Vince\s+?Bielski"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Lee\s+?Harvey\s+?Oswald"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Schmunger"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Stranglove"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "James\s+?Calcutt"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Florentine\s+?Giovanni\s+?Boccaccio"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Prescott\s+?Bush"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Maxwell"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Daniel\s+?Schorr"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Allard\s+?K\.\s+?Lowenstein"}}]}, {"label": "PERSON", "pattern": [{"TEXT": {"REGEX": "Daniel\s+?Patrick\s+?Moynihan"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?National\s+?Institute\s+?of\s+?Health"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Department\s+?of\s+?Justice"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Yakuza"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "YAKUZA"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Citizens'\s+?Committee\s+?to\s+?Clean\s+?Up\s+?the\s+?Courts"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Bank\s+?of\s+?Criminals\s+?and\s+?Conspirators\s+?International"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?U\.S\.\s+?Department\s+?of\s+?Justice"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?U\.S\.\s+?Justice\s+?Department"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?FBI\s+?Field\s+?Office"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Bureau\s+?of\s+?Investigation"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Dallas\s+?Citizens\s+?Council"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?University\s+?of\s+?Maryland,"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Carnegie\s+?Corporation"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Katzenbach\s+?Committee"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Democratic\s+?Congress"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?National\s+?Endowment\s+?for\s+?Democracy"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Congress\s+?for\s+?Cultural\s+?Freedom"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Cambridge\s+?University\s+?Press"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Association\s+?of\s+?National\s+?Security\s+?Alumni"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Avon\s+?Books"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?American\s+?Psychiatric\s+?Association"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Ministry\s+?of\s+?Defence"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Ramparts\s+?Press"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Grove\s+?Press"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?National\s+?Association\s+?of\s+?Scholars"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Council\s+?on\s+?Foreign\s+?Relations"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Symbionese\s+?Liberation\s+?Army"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Washington\s+?Post"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Internal\s+?Revenue\s+?Service"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Terminate\s+?With\s+?Extreme\s+?Prejudice"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Center\s+?for\s+?Strategic\s+?and\s+?International\s+?Studies"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?School\s+?of\s+?Foreign\s+?Service"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?The\s+?Anglo-American\s+?Establishment"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Centre\s+?of\s+?Eternity"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Life\s+?magazine"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Full\s+?Disclosure\s+?Newspaper"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "North\s+American\s+Newspaper\s+Alliance"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Trilateral\s+?Commision"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Ruling\s+?Elite"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?US\s+?Congress"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Church\s+?Committee"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?National\s+?Academy\s+?of\s+?Sciences"}}]}, {"label": "ORG", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Ramparts"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Bab"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Century"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "The\s+?Problem"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Air\s+?Force\s+?One"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Kingdom\s+?of\s+?God"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Grassy\s+?Knoll"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Frankfurt\s+?airport"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Dealey\s+?Plaza"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Central\s+?Africa"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Fort\s+?Detrick"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Area-51"}}]}, {"label": "LOC", "pattern": [{"TEXT": {"REGEX": "Clifton\s+?suspension\s+?bridge"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "mandkind"}}]}, {"label": "NULL", "pattern": [{"TEXT": {"REGEX": "Motor"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "AIDS\s+?virus"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "AIDS"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "AIDS-1"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "AIDS\s+?VIRUS"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "Human\s+?Adult\s+?Leukemia\s+?virus"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "LAV"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "Malaria"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "ARC"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "HTLV-1"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "HTLV-III"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "HTLV"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "HIV"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "HIV\s+?virus"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "Sheep\s+?Visna\s+?Virus"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "Pneumocystis\s+?carinii\s+?pneumonia"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "Kaposi's\s+?sarcoma"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "Smallpox"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "Polio"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "Gunshot"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "LSD"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "Poison"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "MHz"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "TNT"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "Acquired\s+?Immuno-Deficiency\s+?Syndrome"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "Equal\s+?Opportunity\s+?Employer"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "Visna"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "visna"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "visna\s+?virus"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "Korean\s+?War"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "National\s+?Jury\s+?Rights\s+?Day"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "Miranda\s+?Case"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "World\s+?War\s+?II"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "Second\s+?World\s+?War"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "KRISTALLNACHT"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "First\s+?World\s+?War"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "World\s+?War\s+?I"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "Parliament\s+?of\s+?Religions"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "JFK\s+?assassination"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "Apollo\s+?14\s+?mission"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "Apollo\s+?11"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "([Tt]he\s+?)?Andrew\s+?Cetti\s+?Affair"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "Railway\s+?Mania"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "EVENT"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "CHRISTIAN ERA"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "ante-Niccne"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "Vietnam\s+?War"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "Project\s+?Red-light"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "Moon\s+?mission"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "UFO"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "Apollo\s+?11"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "Johnson's\s+?war\s+?on\s+?poverty"}}]}, {"label": "MISC", "pattern": [{"TEXT": {"REGEX": "AIDS"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Chinesse"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Vietnamese"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "Identified\s+?Alien\s+?Crafts"}}]}, {"label": "EVENT", "pattern": [{"TEXT": {"REGEX": "IAC"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "multiculturalists"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Vietnamese"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Anglo-Saxon"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Patriots"}}]}, {"label": "NORP", "pattern": [{"TEXT": {"REGEX": "Patriot"}}]}, ] ruler.add_patterns(patterns) workingDir = os.getcwd() CollPath = os.path.join(workingDir, '../pre-src-xml') outputPath = os.path.join(workingDir, '../src-xml') # Everything in original conspiracy directory. insideDir = os.listdir(CollPath) print(insideDir) # Copies files in case they do not exist def copyTextFiles(file): content = [] # Reads the contents of file, and saves each line of file into the content array. with open(CollPath + "/" + file, 'r', encoding='utf8') as inFile: for line in inFile: content.append(line) print(" ~~~~~~~~~~~~~~~~~~~~~~~~~~~ copying " + file + " ~~~~~~~~~~~~~~~~~~~~~~~~~~~ ") inFile.close() # With the contents copied, a loop will go through the array and write it all in a new file in output folder. with open(outputPath + "/" + file, 'w', encoding='utf8') as f: for line in content: f.write(str(line)) # Function runs through the tokens of given file. Entities are stored in array, then returned. Called by regexFile(). def entitycollector(tokens): # creates a new file that includes all of the found entities. with open('conspPERSON.txt', 'w') as f: entities = {} # goes through each entity in the token list. for ent in sorted(tokens.ents): entityInfo = [ent.text, ent.label_] stringify = str(entityInfo) f.write(stringify) f.write('\n') entities[ent.text] = ent.label_ # return all entities with its label and text. return entities # Function runs regex through given file. def regexFile(file): fileDir = os.path.join(outputPath, file) with PySaxonProcessor(license=False) as proc: # grabs the original xml file and stores it in a variable for later. this some xquery bs xml = open(fileDir, encoding='utf-8').read() xp = proc.new_xpath_processor() node = proc.parse_xml(xml_text=xml) xp.set_context(xdm_item=node) # xquery goes through original text, and stores it all in a single string. xpath = xp.evaluate('//p ! normalize-space() => string-join()') string = str(xpath) # regex goes through the text and deletes anything that is not a letter or space. cleanedText = regex.sub(r'[^A-z ]+', ' ', string) cleanedText = regex.sub(r'\n+', ' ', cleanedText) # gets the tokens of the clean text. tokens = nlp(cleanedText) wrappedText = xml # grabs all the entities in file and stores it in a list/array. dictEntities = entitycollector(tokens) # if anything exists in the list, the following code will run. if dictEntities: # it will check through each entity in the list and see its entity type. it is looking for "PERSON" tokens # in this instance, which includes of nouns and names. for entity in dictEntities.keys(): if dictEntities[entity] == "PERSON" or dictEntities[entity] == "LOC" or dictEntities[entity] == "ORG" or dictEntities[entity] == "GPE" or dictEntities[entity] == "NORP" or dictEntities[entity] == "EVENT": # key_template variable is the elements we wrap around found instances. key_template = "" + entity + "" # loops through wrappedText until all entities are wrapped. wrappedText = wrappedText.replace(entity, key_template) # Saves newly wrapped elements and then writes it into new file. with open(fileDir, 'w', encoding='utf8') as f: f.write(wrappedText) print("WRAPPING " + entity) checkTags(file) # ebb: Added above line to send the tagged file to the checkTags() function for cleaning. # This part of the code is a WIP. # ebb: I just activated it, and it works! (Nice job.) I altered it just a bit. May need more regexes to match. ## It tries to find weird or invalid elements/tags and fix them. def checkTags(file): content = [] fileDir = os.path.join(outputPath, file) with open(fileDir, 'r', encoding='utf8') as inFile: for line in inFile: content.append(line) # With the contents copied, a loop will go through the array and write it all in a new file in output folder. with open(fileDir, 'w', encoding='utf8') as f: for line in content: # match = regex.search(r"([^<>]*?)]+?>([^<>]+?)([^<>]*?)", line) # if match: # print("broken line found, fixing...") # ebb: NOTE: IF this function only processes a line when there's a regex match, we'd have a serious problem: # we'd not output the rest of the file--only the cleaned matches. So the output files would be mostly empty! # Better to just string-clean every line using regex.sub(). Where there's no regex match, no substitution will happen. origLine = line # newLine = regex.sub(r"([^<>]*?)]+?>([^<>]+?)([^<>]*?)", r"\1\2\3",line) # cial> newLine = regex.sub(r"((cia)(l>)", r"\1\2\3", origLine) newLine = regex.sub(r"([^>])(New\s+?York\s+?Times)([^<])", r"\1\2\3", newLine) newLine = regex.sub(r"([^>])(British)([^<])", r"\1\2\3", newLine) newLine = regex.sub(r"([^>])(New\s+?York(\s+?City)?)([^<])", r"\1\2\4", newLine) newLine = regex.sub(r"(Sundays?)", r"\1", newLine) newLine = regex.sub(r"(North)([a-z]*\s+[A-Z][a-z]+)*", r"\1\2", newLine) newLine = regex.sub(r"(North\s+o?f?\s*([A-Z][a-z]+\s+)+)", r"\1", newLine) # newLine = regex.sub(r"(<)(di)(v>)", r"\1\2\3", newLine) newLine = regex.sub(r"([^<]*?)([^<]+?)([^<]*?)", r"\1\2\3", newLine) newLine = regex.sub(r"([^<]*?)([^<]+?)([^<]*?)", r"\1\2\3", newLine) newLine = regex.sub(r"([^<]*?)([^<]+?)([^<]*?)", r"\1\2\3", newLine) newLine = regex.sub(r"([^<]*?)([^<]+?)([^<]*?)", r"\1\2\3", newLine) newLine = regex.sub(r"([^<]*?)([^<]+?)([^<]*?)", r"\1\2\3", newLine) newLine = regex.sub(r"([^<]*?)([^<]+?)([^<]*?)", r"\1\2\3", newLine) # ebb: I'm repeating the above just in case of the weird event of triple or quadruple nested tags in tags. # We saw it happen on the LOTR project and running it through multiple passes of the above line ultimately got rid of them all # preserving only the outermost tags. newLine = regex.sub(r"((ORG)('>)", r"\1\2\3", newLine) newLine = regex.sub(r"()(\w+)(\w+)()", "\1\2 \3\4", newLine) newLine = regex.sub(r"()(\w+)\s+?()(\w+)()(\w+)()(\w+)()()", r"\1\2 \4 \6 \8\9", newLine) # ebb: Problem line below: eliminates John Kennedy's # newLine = regex.sub(r"(\w+)('\w)", r"\1\2", newLine) # # cial> # <div> if origLine != newLine: print("broken line found, fixing...") print(origLine + "\n INTO.") print(newLine) f.write(str(newLine)) print("File checking finished.") for file in insideDir: copyTextFiles(file) regexFile(file) #checkTags(file) # ebb: You don't really want to activate checkTags here, # because it would run over the untagged input files.