/
searchindex.js
1 lines (1 loc) · 104 KB
/
searchindex.js
1
Search.setIndex({"docnames": ["analyze/entities", "analyze/overview", "analyze/phrases", "analyze/processing", "analyze/questions", "analyze/tokens", "analyze/tomotopy", "analyze/what", "clean/cleaning", "clean/dataframes", "clean/overview", "clean/scrape", "clean/sketch", "generate/fine-tune", "generate/hf", "generate/inference", "generate/ml", "generate/overview", "generate/soon", "intro", "intro/data-types", "intro/lists", "intro/logic", "intro/loops", "intro/overview", "intro/script", "intro/variables", "scrape/ethics", "scrape/explore", "scrape/inspector", "scrape/legiscan_api", "scrape/overview", "scrape/scrape", "scrape/what"], "filenames": ["analyze/entities.ipynb", "analyze/overview.md", "analyze/phrases.ipynb", "analyze/processing.ipynb", "analyze/questions.md", "analyze/tokens.ipynb", "analyze/tomotopy.ipynb", "analyze/what.md", "clean/cleaning.ipynb", "clean/dataframes.ipynb", "clean/overview.md", "clean/scrape.ipynb", "clean/sketch.ipynb", "generate/fine-tune.ipynb", "generate/hf.md", "generate/inference.ipynb", "generate/ml.ipynb", "generate/overview.md", "generate/soon.md", "intro.md", "intro/data-types.ipynb", "intro/lists.ipynb", "intro/logic.ipynb", "intro/loops.ipynb", "intro/overview.md", "intro/script.md", "intro/variables.ipynb", "scrape/ethics.md", "scrape/explore.ipynb", "scrape/inspector.md", "scrape/legiscan_api.ipynb", "scrape/overview.md", "scrape/scrape.ipynb", "scrape/what.md"], "titles": ["the <code class=\"docutils literal notranslate\"><span class=\"pre\">Entity-Ruler</span></code>", "workshop overview", "the <code class=\"docutils literal notranslate\"><span class=\"pre\">PhraseMatcher</span></code>", "the <code class=\"docutils literal notranslate\"><span class=\"pre\">spaCy</span></code> pipeline", "research questions: defining gender", "the token <code class=\"docutils literal notranslate\"><span class=\"pre\">Matcher</span></code>", "<no title>", "what is text analysis?", "cleaning our text", "dataframes", "workshop overview", "scraping our text", "dataframes: import libraries", "fine-tuning", "Huggingface\ud83e\udd17 platform", "running inference", "machine learning", "workshop overview", "coming soon!", "\u201cIntro to Python for Working with Text\u201d workshop series", "data types", "lists", "logic", "loops", "workshop overview", "opening challenge", "variables", "what is ethical? what is legal?", "exploring <code class=\"docutils literal notranslate\"><span class=\"pre\">bs4</span></code>", "the HTML Inspector", "Legiscan API", "workshop overview", "scraping with <code class=\"docutils literal notranslate\"><span class=\"pre\">bs4</span></code>", "what is web scraping?"], "terms": {"from": [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 16, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 31, 33], "name": [0, 1, 6, 7, 8, 9, 11, 12, 14, 15, 21, 26, 28, 29, 32, 33], "recognit": [0, 1, 7, 10, 16, 27, 30, 31], "ar": [0, 1, 2, 3, 4, 5, 7, 8, 9, 11, 12, 13, 14, 15, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "label": [0, 2, 3, 5, 7, 13, 26, 28, 30], "ad": [0, 2, 3, 6, 21, 28, 30, 32], "certain": [0, 4, 7, 20, 22, 28, 32], "word": [0, 2, 3, 5, 6, 7, 13, 14, 15, 17, 20, 21, 22, 23, 26, 28], "number": [0, 2, 4, 6, 9, 10, 12, 13, 16, 20, 21, 28, 31, 32], "fit": [0, 20], "within": [0, 1, 3, 4, 7, 8, 9, 11, 15, 20, 21, 22, 23, 24, 26, 27, 28, 29, 31, 32], "categori": [0, 4, 28, 32], "like": [0, 1, 2, 3, 4, 5, 7, 8, 11, 12, 14, 15, 16, 17, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 31, 32, 33], "person": [0, 3, 5, 13, 16, 25, 27, 28, 32], "place": [0, 2, 3, 4, 7, 21, 27], "time": [0, 2, 3, 4, 5, 6, 12, 13, 14, 21, 22, 23, 25, 26, 27, 28, 29, 30, 32], "date": [0, 3, 9, 11, 12, 28], "These": [0, 3, 7, 8, 14, 16, 26, 28], "repres": [0, 2, 8, 11, 12, 16, 21, 26, 28], "rel": [0, 28, 31, 32], "import": [0, 2, 3, 5, 6, 7, 8, 9, 11, 13, 14, 15, 16, 20, 21, 22, 26, 27, 28, 30, 32], "data": [0, 1, 2, 3, 4, 5, 7, 8, 10, 11, 12, 14, 16, 19, 21, 22, 23, 24, 25, 26, 27, 28, 30, 31, 33], "which": [0, 2, 3, 4, 5, 6, 7, 8, 11, 12, 14, 15, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "why": [0, 9, 11, 20, 21, 22, 27, 33], "ner": [0, 1, 5], "pick": [0, 2], "them": [0, 2, 3, 5, 7, 8, 11, 14, 15, 16, 20, 21, 26, 27, 28, 30, 31, 32], "out": [0, 2, 3, 4, 5, 8, 9, 11, 12, 14, 15, 16, 19, 20, 21, 22, 23, 26, 27, 28, 30, 33], "By": [0, 1, 7, 16, 19, 21, 25, 27, 28], "custom": [0, 2, 3, 5, 6, 10, 16, 17, 19], "short": [0, 8, 11, 12, 28, 29], "we": [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 11, 12, 13, 14, 15, 16, 19, 20, 21, 22, 23, 24, 25, 26, 28, 29, 30, 32, 33], "can": [0, 1, 2, 3, 4, 5, 7, 8, 9, 11, 13, 14, 15, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 32, 33], "defin": [0, 2, 5, 8, 23, 27, 28, 31, 32], "own": [0, 2, 4, 7, 8, 20, 26, 27, 28, 33], "instruct": [0, 3, 7, 11, 12, 14, 19, 23, 28], "how": [0, 1, 2, 3, 4, 5, 7, 9, 10, 13, 14, 15, 16, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "find": [0, 2, 4, 7, 8, 11, 12, 14, 15, 16, 19, 32, 33], "entit": [0, 3, 5], "choos": [0, 14, 22], "For": [0, 2, 3, 4, 5, 6, 7, 11, 16, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 31, 33], "thi": [0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "project": [0, 1, 19, 27, 28, 33], "captur": [0, 2, 5, 13, 15, 25, 27], "phrase": [0, 5, 7, 28], "relat": [0, 4, 5, 7, 9, 11, 12, 28, 32], "gender": [0, 2, 5, 10, 12, 13, 16, 21, 22, 23, 25, 26, 27, 28, 30, 31, 32], "sex": [0, 2, 4, 5, 13, 15, 27, 28, 31, 32], "male": [0, 4, 5, 15, 28, 32], "femal": [0, 4, 5, 13, 15, 28, 32], "exampl": [0, 2, 3, 4, 5, 7, 15, 16, 20, 21, 23, 26, 27, 28, 29, 33], "after": [0, 2, 3, 5, 11, 12, 13, 15, 16, 21, 27, 28, 30], "want": [0, 2, 4, 5, 8, 12, 13, 15, 19, 20, 21, 23, 26, 27, 28, 29, 32, 33], "At": [0, 3, 17, 27, 28, 32, 33], "end": [0, 1, 2, 3, 5, 14, 15, 17, 21, 25, 26, 27, 28, 32, 33], "pass": [0, 3, 10, 12, 13, 15, 22, 23, 26, 28, 31, 32], "dataset": [0, 2, 3, 5, 7, 9, 11, 13, 16, 17, 22, 23, 27, 28, 31, 32], "bill": [0, 2, 4, 8, 9, 10, 12, 19, 27, 28, 29, 30, 31], "through": [0, 2, 3, 4, 5, 10, 11, 12, 19, 22, 23, 28, 30, 32, 33], "pipelin": [0, 2, 6, 13, 15], "go": [0, 3, 11, 12, 14, 15, 16, 21, 23, 25, 27, 28, 29, 32, 33], "entir": [0, 21, 28], "process": [0, 1, 2, 3, 4, 5, 6, 7, 10, 11, 13, 15, 16, 17, 19, 20, 21, 22, 26, 27, 28, 33], "onc": [0, 8, 21, 23, 25, 27, 28, 29], "more": [0, 2, 3, 4, 5, 6, 7, 8, 10, 11, 14, 15, 16, 19, 20, 21, 22, 23, 26, 27, 28, 29, 31, 32, 33], "pipe": [0, 3, 6, 13, 15], "here": [0, 1, 2, 3, 4, 7, 8, 11, 14, 15, 16, 21, 22, 23, 26, 27, 28, 30, 32, 33], "step": [0, 2, 3, 4, 5, 6, 8, 9, 12, 13, 15, 21, 29, 30], "order": [0, 2, 4, 9, 11, 12, 22, 28, 30], "exact": [0, 2], "you": [0, 1, 2, 3, 4, 5, 6, 8, 11, 13, 14, 15, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "re": [0, 2, 3, 4, 5, 8, 9, 11, 12, 16, 20, 26, 27, 28, 30], "look": [0, 2, 7, 8, 12, 14, 15, 16, 20, 21, 22, 27, 28, 29, 30, 32, 33], "now": [0, 2, 5, 9, 14, 15, 20, 21, 22, 23, 26, 28, 29, 30, 32], "includ": [0, 1, 2, 3, 4, 5, 7, 8, 11, 12, 13, 14, 19, 20, 21, 22, 27, 28, 29, 33], "note": [0, 3, 6, 11, 13, 14, 22, 28, 29, 32], "advanc": [0, 7, 19, 20, 21, 26], "user": [0, 2, 3, 5, 6, 7, 13, 14, 15, 24, 27, 28, 32], "If": [0, 1, 2, 3, 5, 6, 8, 11, 13, 15, 22, 27, 28, 29, 32, 33], "train": [0, 2, 3, 5, 6, 7, 13, 14, 15, 27, 28], "model": [0, 2, 3, 5, 6, 7, 13, 15, 16, 17, 19, 20, 27], "definit": [0, 2, 4, 5, 8, 13, 15, 27, 28, 32], "sexual": [0, 2, 4, 5, 21, 22, 23, 25, 26, 28, 32], "new": [0, 1, 3, 5, 7, 11, 12, 14, 15, 19, 21, 22, 23, 24, 26, 28, 29, 32, 33], "could": [0, 5, 8, 16, 23, 26, 27, 28], "us": [0, 1, 2, 3, 5, 6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "help": [0, 1, 5, 7, 16, 21, 22, 23, 25, 26, 29], "prepar": [0, 7, 10, 13, 19, 21, 22, 23, 25, 26], "would": [0, 2, 5, 7, 8, 9, 15, 21, 22, 23, 33], "first": [0, 2, 3, 4, 5, 7, 8, 9, 11, 12, 14, 15, 16, 19, 20, 21, 22, 23, 26, 27, 28, 29, 30, 32], "your": [0, 3, 4, 5, 6, 8, 9, 13, 15, 20, 23, 27, 28, 29, 30, 32, 33], "fine": [0, 14, 17, 19, 23], "tune": [0, 14, 17, 19], "Then": [0, 2, 5, 8, 11, 12, 14, 15, 21, 22, 23, 27, 28, 30, 32, 33], "when": [0, 3, 8, 15, 16, 20, 21, 22, 23, 25, 26, 27, 28, 29, 32], "s": [0, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 19, 20, 21, 22, 23, 26, 27, 28, 29, 30, 32, 33], "never": [0, 29], "seen": [0, 10, 21, 26, 29, 31], "befor": [0, 2, 3, 5, 7, 14, 15, 16, 21, 23, 26, 28, 29, 32, 33], "automat": [0, 8, 21, 22], "appli": [0, 3, 26, 27], "rule": [0, 1, 7, 11, 12, 21, 26], "an": [0, 2, 3, 4, 5, 6, 7, 8, 10, 11, 12, 14, 15, 16, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33], "see": [0, 1, 2, 3, 5, 6, 8, 9, 10, 11, 12, 14, 15, 16, 19, 20, 21, 22, 23, 24, 26, 27, 28, 29, 31, 32, 33], "dr": 0, "mattingli": [0, 19], "excel": [0, 16, 27], "tutori": [0, 1, 24], "subject": [0, 3, 4, 5, 9, 25, 27, 28], "load": [0, 2, 3, 5, 6, 8, 11, 12, 13, 16, 17, 21, 32], "up": [0, 2, 3, 5, 8, 9, 11, 12, 13, 15, 16, 19, 21, 28, 29, 30, 32, 33], "librari": [0, 1, 2, 3, 5, 7, 9, 10, 11, 16, 17, 19, 27, 28, 30, 31, 32, 33], "spaci": [0, 1, 2, 5, 6, 7, 19], "request": [0, 2, 5, 8, 11, 12, 19, 28, 30, 31, 32, 33], "en_core_web_sm": [0, 2, 3, 5, 6], "caladof": [0, 2, 3, 5, 6, 13, 15], "anaconda3": [0, 2, 3, 5, 6, 12, 13], "lib": [0, 2, 3, 5, 6, 12, 13], "python3": [0, 2, 3, 5, 6, 12, 13], "11": [0, 2, 3, 5, 6, 9, 11, 12, 13, 28, 30], "site": [0, 2, 3, 5, 6, 12, 13, 27, 28, 32], "packag": [0, 2, 3, 5, 6, 12, 13, 28, 33], "util": [0, 2, 3, 5, 6, 12], "py": [0, 2, 3, 5, 6, 12, 13], "910": [0, 2, 3, 5, 6], "userwarn": [0, 2, 3, 5, 6, 13], "w095": [0, 2, 3, 5, 6], "5": [0, 2, 3, 5, 6, 8, 9, 11, 12, 19, 20, 21, 22, 23, 25, 26, 28, 30, 32], "0": [0, 2, 3, 5, 6, 9, 11, 12, 13, 15, 16, 19, 21, 28, 30, 32], "wa": [0, 2, 3, 5, 6, 8, 9, 11, 12, 15, 16, 21, 26, 27], "v3": [0, 2, 3, 5, 6], "mai": [0, 2, 3, 5, 6, 8, 11, 12, 19, 20, 21, 26, 27, 28, 29, 32], "100": [0, 2, 3, 5, 6, 8, 9, 13, 21, 28, 30, 32], "compat": [0, 2, 3, 5, 6], "current": [0, 2, 3, 4, 5, 6, 10, 15, 19, 21, 23, 28, 33], "version": [0, 2, 3, 5, 6, 27], "7": [0, 2, 3, 5, 6, 9, 11, 12, 28, 30], "error": [0, 2, 3, 5, 6, 11, 12, 20], "degrad": [0, 2, 3, 5, 6], "perform": [0, 2, 3, 5, 6, 16, 17, 28, 32], "download": [0, 1, 2, 3, 5, 6, 9, 11, 12, 14, 15, 16, 30], "newer": [0, 2, 3, 5, 6], "retrain": [0, 2, 3, 5, 6], "detail": [0, 2, 3, 5, 6, 14, 19, 21, 23, 27, 28], "avail": [0, 2, 3, 5, 6, 21, 22, 23, 25, 26, 27], "updat": [0, 2, 3, 5, 6, 12, 13, 27, 28], "python": [0, 1, 2, 3, 5, 6, 7, 8, 10, 11, 12, 15, 17, 20, 21, 22, 24, 25, 26, 28, 31, 32, 33], "m": [0, 2, 3, 4, 5, 6, 11, 15, 19, 27, 28, 29, 32], "valid": [0, 2, 3, 5, 6], "warn": [0, 2, 3, 5, 6, 12, 13, 15], "warn_msg": [0, 2, 3, 5, 6], "anytim": 0, "mention": [0, 20], "let": [0, 2, 5, 7, 8, 9, 11, 14, 15, 20, 21, 22, 23, 25, 26, 28, 32], "try": [0, 6, 9, 13, 14, 21, 22, 23, 27, 29], "separ": [0, 3, 11, 12, 21, 22, 28, 32], "term": [0, 2, 4, 5, 6, 7, 11, 15, 27, 28, 31, 32], "list": [0, 2, 3, 4, 6, 7, 8, 9, 11, 12, 14, 15, 16, 20, 22, 23, 26, 27, 28, 30, 32, 33], "syntax": [0, 1, 9, 21, 23, 24, 26, 28, 30, 31, 32], "json": [0, 5, 13, 30, 33], "format": [0, 3, 5, 6, 8, 9, 10, 11, 12, 19, 20, 21, 26, 27, 30, 32, 33], "match": [0, 2, 7, 22, 33], "The": [0, 2, 3, 4, 5, 6, 8, 10, 12, 13, 14, 15, 16, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33], "orient": [0, 2, 4, 5, 19, 26, 28, 31, 32], "catch": [0, 2, 5], "tran": [0, 3, 5, 19, 28, 29], "nonbinari": [0, 5, 12], "biolog": [0, 2, 4, 5, 13, 28, 32], "queer": [0, 5], "ident": [0, 2, 4, 5, 10, 28, 31], "lgbtq": [0, 4, 5, 12, 27], "lgbt": [0, 5], "lgbtqia": [0, 5, 12], "entityrul": [0, 5], "object": [0, 4, 5, 7, 11, 12, 15, 19, 20, 21, 23, 25, 30, 32, 33], "add_pip": [0, 5], "entity_rul": [0, 5], "need": [0, 2, 11, 13, 14, 16, 21, 22, 23, 25, 26, 27, 28, 29, 30, 32, 33], "add_pattern": [0, 5], "check": [0, 9, 11, 12, 15, 19, 22, 26, 27, 28, 32], "pipe_nam": 0, "tok2vec": 0, "tagger": [0, 3], "parser": [0, 3, 6, 12, 28, 33], "attribute_rul": 0, "lemmat": 0, "rememb": [0, 2, 8, 21, 22, 23, 27, 28, 32], "ensur": [0, 9, 12, 13, 28], "contain": [0, 3, 4, 7, 9, 12, 14, 15, 16, 20, 21, 22, 23, 27, 28, 29, 31, 32, 33], "ha": [0, 3, 4, 5, 8, 9, 11, 12, 13, 15, 16, 20, 21, 26, 27, 28, 30, 32, 33], "chanc": 0, "sampl": [0, 2, 5, 8, 11, 29], "million": [0, 2, 5], "charact": [0, 2, 5, 8, 12, 20, 21, 23, 26], "clean": [0, 2, 5, 6, 10, 11, 14, 19, 22, 23, 30, 31, 32], "sourc": [0, 2, 5, 8, 12, 14, 16, 25, 27, 28, 33], "get": [0, 2, 3, 4, 5, 8, 9, 11, 12, 13, 14, 15, 16, 20, 21, 27, 29, 30, 32, 33], "http": [0, 2, 3, 5, 6, 8, 9, 11, 12, 27, 28, 29, 30, 32, 33], "bit": [0, 2, 3, 5, 8, 9, 12, 15, 16, 21, 23, 26, 32, 33], "ly": [0, 2, 5, 8, 9, 12], "senate_117_bills_clean": [0, 2, 5], "content": [0, 1, 2, 5, 8, 11, 12, 21, 24, 28, 32], "decod": [0, 2, 5, 8, 12], "utf": [0, 2, 5, 8, 11, 12], "8": [0, 2, 5, 6, 8, 9, 11, 12, 13, 28, 30, 32], "doc": [0, 1, 2, 5, 6, 8, 11, 12, 13, 24, 28], "500000": [0, 2, 5], "extract": [0, 1, 7, 12, 15, 19, 25, 27, 31, 32, 33], "ent": [0, 3], "60": [0, 6, 9, 28], "label_": [0, 3], "u": [0, 2, 4, 8, 11, 12], "govern": [0, 2, 8, 11, 12, 28, 30, 32], "publish": [0, 2, 8, 11, 12, 14, 19, 27, 30, 33], "org": [0, 3, 27, 33], "senat": [0, 2, 8, 9, 11, 12, 28, 30], "IS": [0, 2], "lt": [0, 2, 8, 9, 11, 12], "gt": [0, 2, 8, 9, 11, 12], "117th": [0, 2, 8, 11, 12], "5242to": [0, 2], "cardin": 0, "THE": [0, 2, 8, 11, 12], "unit": [0, 2, 8, 9, 11, 12, 22, 27, 28], "state": [0, 2, 5, 6, 8, 9, 10, 11, 12, 13, 27, 28, 30, 31, 32], "gpe": 0, "decemb": [0, 2], "13": [0, 2, 6, 9, 11, 12, 28, 30], "2022mr": [0, 2], "collin": [0, 2], "committe": [0, 2, 8, 9, 11, 12, 28, 30], "foreignrel": [0, 2], "A": [0, 2, 4, 5, 7, 8, 9, 11, 12, 14, 16, 20, 21, 23, 26, 28, 29, 32], "hous": [0, 2, 8, 9, 11, 12, 28, 30], "america": [0, 2, 8, 11, 12], "congress": [0, 2, 4, 8, 9, 11, 12, 27, 28, 30, 31], "section": [0, 2, 3, 5, 6, 8, 11, 14, 21, 22, 27, 28, 29, 32], "law": [0, 2, 5, 11, 12, 27, 28, 30, 32], "titl": [0, 3, 8, 9, 11, 12, 27, 28, 29, 30, 32], "intern": [0, 2, 4, 5, 8, 11, 12, 15, 19], "violenc": [0, 2, 12, 16, 21, 22, 23, 25, 26, 28], "against": [0, 2, 4, 23, 27, 28, 32], "women": [0, 2, 5, 28], "act": [0, 2, 8, 9, 11, 12, 16, 28, 30, 32], "product": [0, 2, 5, 14, 20], "sec": [0, 8, 12], "strategi": [0, 13, 15], "TO": [0, 12], "prevent": [0, 2, 8, 10, 11, 12, 20, 28, 31, 32], "basedviol": 0, "101": [0, 6, 9], "201": [0, 2, 9], "202": [0, 2, 5, 9], "203": [0, 9], "204": [0, 9], "estim": 0, "70": [0, 6, 9], "percent": 0, "swaziland": 0, "tanzania": 0, "zimbabw": 0, "kenya": 0, "haiti": 0, "between": [0, 2, 4, 5, 6, 7, 11, 13, 14, 16, 20, 21, 22, 26, 28, 30, 31, 32, 33], "28": [0, 6, 9, 28], "38": [0, 6, 9], "9": [0, 6, 9, 11, 12, 22, 28, 30], "18": [0, 6, 8, 9, 11, 12, 28], "year": [0, 4, 10, 12, 26, 28, 31, 32], "6": [0, 2, 5, 6, 9, 11, 12, 22, 28, 30], "men": [0, 2, 5], "equal": [0, 22, 27, 28], "survei": 0, "three": [0, 5, 13, 28, 29, 32, 33], "world": [0, 3, 11, 12, 15, 16, 20, 28], "health": [0, 2, 6, 12, 28], "organ": [0, 4, 11, 12, 20, 21, 24, 27, 28], "than": [0, 2, 5, 10, 11, 12, 16, 22, 27, 28, 31, 33], "50": [0, 6, 9, 13, 15, 27, 28, 30], "four": [0, 2, 8, 28, 32], "fold": 0, "also": [0, 2, 3, 4, 5, 7, 9, 11, 12, 14, 16, 20, 21, 22, 23, 26, 27, 28, 29, 33], "have": [0, 1, 2, 5, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 19, 20, 21, 26, 27, 28, 29, 30, 31, 32, 33], "again": [0, 12, 14, 21, 28], "20": [0, 6, 9, 11, 12, 28], "300": [0, 12, 28, 32], "500": [0, 10, 28, 31], "In": [0, 2, 3, 5, 6, 7, 8, 10, 11, 12, 13, 16, 20, 21, 22, 23, 26, 27, 28, 29, 30, 31, 32, 33], "next": [0, 2, 3, 5, 12, 20, 21, 22, 27, 29, 30, 31, 32], "leverag": [0, 3, 5, 7, 20], "sophist": 0, "matcher": [0, 2], "class": [0, 5, 9, 11, 21, 22, 23, 25, 26, 28, 29, 30, 32], "welcom": [1, 9, 17], "text": [1, 2, 3, 4, 5, 6, 9, 10, 12, 13, 14, 15, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 30, 31, 32], "analysi": [1, 2, 3, 4, 5, 10, 11, 16, 19, 23, 25, 27, 31], "introduc": [1, 2, 8, 10, 11, 12, 16, 17, 19, 21, 23, 24, 26, 30, 31], "search": [1, 3, 7, 9, 11, 12, 14, 15, 27, 28, 33], "pattern": [1, 2, 3, 4, 7, 19, 21, 22, 23, 25, 26], "build": [1, 4, 7, 10, 17, 19, 22, 28], "skill": [1, 19, 21, 22], "previou": [1, 4, 5, 8, 10, 11, 12, 13, 17, 19, 22, 32], "basic": [1, 5, 6, 8, 10, 13, 19, 24, 27, 31], "gather": [1, 2, 5, 7, 11, 19, 27, 30, 31, 32], "web": [1, 11, 12, 15, 19, 22, 26, 27, 28, 29, 30, 31, 32], "scrape": [1, 8, 14, 19, 22, 26, 27, 28, 30, 31], "toward": [1, 4, 12], "explor": [1, 4, 7, 9, 14, 16, 17, 19, 24, 31, 33], "textual": [1, 7, 19, 21], "although": [1, 27], "materi": [1, 19, 28], "follow": [1, 2, 3, 5, 8, 9, 11, 12, 13, 15, 16, 21, 26, 27, 28, 29, 32, 33], "along": [1, 15, 32], "concept": [1, 3, 7, 15, 16, 17, 19, 21, 23, 26], "design": [1, 4, 5, 28, 32], "programm": [1, 21, 22, 23, 26, 32], "all": [1, 2, 3, 5, 8, 9, 11, 12, 13, 20, 22, 23, 26, 27, 28, 30, 32], "level": [1, 15, 19, 22, 23, 28, 29], "total": [1, 2, 6, 9, 11, 14, 27, 30, 31], "beginn": [1, 11, 19, 20, 22, 31, 33], "particip": [1, 10, 17, 19, 28, 31, 32], "high": [1, 17, 28], "understand": [1, 2, 4, 5, 16, 20, 21, 22, 23, 25, 26, 27], "stage": 1, "familiar": 1, "natur": [1, 4, 5, 7, 15, 16, 19], "languag": [1, 3, 4, 6, 7, 13, 14, 16, 19, 20, 24, 27, 28, 29, 31, 32], "nlp": [1, 2, 3, 5, 16, 19], "some": [1, 2, 3, 4, 6, 7, 8, 9, 14, 15, 16, 21, 23, 24, 26, 27, 28, 30, 32, 33], "popular": [1, 3, 7, 16, 19, 21, 23, 27, 28, 33], "task": [1, 14, 15, 19, 32], "entiti": [1, 5, 7, 27, 28, 32], "practic": [1, 2, 10, 11, 14, 15, 16, 19, 21, 22, 23, 25, 26, 28, 31, 32], "write": [1, 3, 4, 7, 8, 10, 11, 12, 15, 19, 20, 21, 22, 23, 28, 30, 32], "read": [1, 2, 6, 8, 9, 12, 20, 21, 23, 25, 26, 28, 30, 32], "seri": [1, 3, 9, 16, 17, 33], "continu": [1, 8, 11, 12, 15, 30], "browser": [1, 24, 27, 29, 30, 31, 33], "base": [1, 3, 4, 7, 10, 12, 14, 16, 20, 21, 22, 24, 28, 31, 32, 33], "tool": [1, 7, 16, 17, 19, 21, 22, 23, 24, 25, 26, 27, 29, 31], "run": [1, 3, 6, 8, 12, 14, 17, 19, 21, 22, 23, 24, 26, 27, 32], "code": [1, 3, 4, 6, 7, 8, 9, 12, 14, 15, 16, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33], "offer": [1, 3, 4, 9, 11, 12, 14, 19, 21, 24, 27, 28], "cloud": [1, 3, 7, 24], "environ": [1, 3, 15, 29], "author": [1, 24, 25, 28, 32], "much": [1, 5, 9, 16, 30], "mean": [1, 2, 4, 5, 6, 7, 9, 13, 15, 16, 20, 21, 22, 23, 25, 26, 27, 28], "without": [1, 4, 5, 21, 27, 28, 32, 33], "instal": [1, 3, 13, 15, 24, 33], "pleas": [1, 15, 19, 24, 29], "specif": [1, 2, 3, 5, 7, 11, 15, 16, 19, 20, 21, 23, 24, 26, 28, 31, 33], "allow": [2, 4, 5, 11, 16, 21, 22, 26, 27, 28, 32, 33], "sequenc": [2, 13, 15, 20, 21], "realli": [2, 3, 21, 23, 24], "alreadi": [2, 8, 15, 16, 20, 26, 27, 30, 32], "know": [2, 3, 4, 15, 16, 21, 23, 26, 28], "kind": [2, 3, 4, 5, 7, 11, 12, 14, 16, 20, 22, 25, 26], "thing": [2, 8, 10, 11, 14, 15, 16, 20, 21, 22, 23, 25, 26, 27, 32], "variat": [2, 5, 16], "those": [2, 4, 7, 8, 10, 11, 12, 16, 27, 28, 29, 31, 32], "But": [2, 3, 11, 20, 21, 22, 26, 27], "so": [2, 3, 4, 5, 7, 8, 11, 13, 14, 15, 16, 20, 21, 22, 26, 27, 28, 30, 32, 33], "account": [2, 11, 12, 13, 16, 21, 22, 23, 25, 26, 28, 30], "few": [2, 4, 14, 20, 21, 23, 26, 30, 33], "wai": [2, 3, 4, 8, 10, 11, 13, 14, 15, 20, 21, 22, 23, 24, 25, 26, 27, 28, 31, 32, 33], "handl": [2, 12, 27, 32], "complex": [2, 14, 20, 27], "token": [2, 13, 15, 22], "involv": [2, 5, 7, 11, 16, 27, 28, 30], "divid": 2, "below": [2, 3, 4, 5, 8, 9, 16, 19, 27, 28, 29, 32, 33], "close": [2, 7, 8, 12, 16, 28], "saw": [2, 23], "least": [2, 28], "singl": [2, 5, 6, 11, 21, 28], "quot": [2, 5, 8, 12, 20, 21, 22], "form": [2, 3, 5, 9, 16, 21, 22, 23, 25, 26, 33], "backtick": 2, "requir": [2, 4, 8, 11, 12, 16, 21, 24, 28, 32, 33], "narrow": [2, 5, 14, 28, 32], "most": [2, 6, 7, 11, 12, 13, 14, 16, 19, 20, 21, 23, 24, 26, 27, 28, 32, 33], "common": [2, 12, 19, 20, 21, 26, 28, 32, 33], "element": [2, 7, 8, 9, 19, 25, 27, 28, 29, 32, 33], "appear": [2, 4, 5, 7, 21, 27, 28, 29, 32, 33], "i": [2, 3, 4, 5, 6, 9, 11, 12, 13, 15, 20, 21, 22, 23, 28, 29, 30, 32, 33], "am": [2, 4, 5], "leav": 2, "everyth": [2, 20, 21, 28, 32], "becaus": [2, 3, 14, 16, 20, 21, 22, 23, 27, 28, 32, 33], "sometim": [2, 16], "thei": [2, 3, 4, 5, 7, 10, 11, 13, 16, 17, 19, 21, 22, 23, 25, 26, 27, 28, 29, 31, 32, 33], "doubl": [2, 4, 5, 12], "possibl": [2, 4, 6, 15, 16, 23, 27, 28], "our": [2, 3, 4, 5, 7, 9, 12, 13, 14, 15, 20, 21, 22, 23, 26, 30, 31], "therefor": [2, 21, 26], "necessari": [2, 3, 13, 15, 32], "english": [2, 3], "add": [2, 3, 5, 8, 11, 12, 13, 16, 19, 20, 21, 22, 23, 28, 30, 32], "vocab": [2, 5, 6, 13], "each": [2, 3, 4, 6, 8, 9, 11, 12, 14, 16, 19, 20, 21, 22, 23, 26, 27, 28, 30, 33], "one": [2, 3, 4, 5, 7, 8, 14, 16, 19, 20, 21, 22, 23, 26, 27, 28, 30, 32, 33], "numer": [2, 11, 21], "convert": [2, 12, 13], "plain": [2, 5, 12, 30], "string": [2, 3, 5, 8, 10, 12, 20, 21, 22, 26], "final": [2, 5, 8, 12, 15, 17, 20, 22, 27, 32], "type": [2, 5, 6, 7, 9, 11, 12, 13, 14, 15, 19, 21, 22, 23, 24, 26, 28, 32], "byte": [2, 12], "function": [2, 3, 6, 10, 11, 12, 13, 15, 19, 22, 23, 24, 28, 32], "slice": [2, 8, 12, 22, 28], "around": [2, 7, 11, 12, 29], "memori": [2, 9, 11, 12, 21, 30], "constraint": [2, 5], "b": [2, 4, 5, 6, 8, 9, 11, 12, 28, 29], "congression": [2, 8, 11, 12], "congressfrom": [2, 8, 12], "offic": [2, 5, 8, 11, 12, 27, 28], "5242": 2, "congress2d": 2, "session": [2, 8, 11, 12, 19, 22, 28], "otherpurpos": [2, 8, 12], "IN": [2, 5, 8, 9, 11, 12, 28], "OF": [2, 8, 11], "shaheen": 2, "herself": 2, "ms": [2, 28, 32], "twice": [2, 9, 12], "refer": [2, 8, 9, 11, 12, 19, 20, 26, 27, 28, 30], "To": [2, 4, 7, 8, 10, 11, 12, 13, 15, 16, 20, 21, 22, 23, 26, 27, 28, 29, 30, 32, 33], "Be": [2, 8, 11, 12, 27], "enact": [2, 8, 11, 12, 28, 30], "assembl": [2, 8, 11, 12, 28], "len": [2, 5, 6, 11, 12], "86025": 2, "10": [2, 5, 6, 9, 11, 12, 21, 22, 23, 28, 30, 32], "hash": 2, "start": [2, 4, 5, 8, 14, 20, 21, 28, 29, 31, 32, 33], "locat": [2, 21, 28], "5344954752463023658": 2, "2287": 2, "2289": 2, "4384": 2, "4386": 2, "7828": 2, "7830": 2, "8041": 2, "8043": 2, "8169": 2, "8171": 2, "8340": 2, "8342": 2, "8463": 2, "8465": 2, "8470": 2, "8472": 2, "8490": 2, "8492": 2, "8501": 2, "8503": 2, "mani": [2, 4, 5, 8, 13, 14, 16, 20, 22, 24, 27, 33], "got": [2, 11, 15, 30], "72": [2, 9, 28], "consist": [2, 16, 21, 28, 33], "numerica": 2, "posit": [2, 7, 21, 28, 32], "actual": [2, 4, 5, 13, 16, 28, 32], "sent": [2, 5], "attribut": [2, 5, 14, 19, 29, 32], "socioeconom": [2, 5], "quantit": [2, 5], "qualit": [2, 5], "inform": [2, 3, 4, 5, 10, 15, 20, 27, 28, 29, 30, 31, 33], "identifi": [2, 5, 8, 23, 27, 28], "explain": [2, 5, 20, 21, 23, 27, 28, 32, 33], "gap": [2, 5, 28, 32], "typic": [2, 5, 27], "examin": [2, 4, 5, 27, 28, 29, 30], "differ": [2, 5, 7, 13, 14, 15, 16, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 31, 32, 33], "statu": [2, 5], "differenti": [2, 5, 21, 22, 23, 25, 26], "access": [2, 3, 4, 5, 9, 10, 12, 21, 27, 28, 30, 31, 33], "control": [2, 5, 13, 21, 22, 23, 25, 26, 28], "over": [2, 4, 5, 11, 13, 14, 21, 22, 23, 25, 26, 28, 33], "asset": [2, 5], "resourc": [2, 5, 28], "educ": [2, 5, 9, 12, 28, 32], "opportun": [2, 4, 5, 21, 27, 28, 32], "servic": [2, 5, 9, 12, 21, 22, 23, 25, 26, 27, 28], "ii": [2, 5], "influenc": [2, 5, 11, 12], "role": [2, 4, 5, 11, 12, 28], "structur": [2, 5, 9, 10, 15, 22, 24, 30, 32, 33], "barrier": [2, 5], "norm": [2, 5], "divis": [2, 5, 28], "paid": [2, 5, 28], "unpaid": [2, 5], "work": [2, 5, 7, 8, 9, 10, 11, 12, 13, 15, 16, 17, 20, 21, 22, 23, 24, 25, 26, 27, 28, 31, 32, 33], "subsist": [2, 5], "care": [2, 5, 12, 28], "famili": [2, 5, 14, 28, 32], "member": [2, 5, 8, 11, 12, 28], "volunt": [2, 5], "activ": [2, 4, 5, 15, 28, 32], "iii": [2, 5], "leadership": [2, 5], "decis": [2, 5, 20, 22, 28], "make": [2, 3, 4, 5, 8, 11, 12, 13, 14, 16, 20, 21, 22, 23, 25, 26, 27, 28, 30, 31, 32, 33], "entri": [2, 5, 9, 11, 30], "point": [2, 5, 20, 21, 31], "empow": [2, 5], "iv": [2, 5], "potenti": [2, 4, 5, 15, 27], "impact": [2, 5, 14], "develop": [2, 4, 5, 11, 12, 14, 15, 16, 28, 29], "polici": [2, 5, 8, 11, 12, 28, 32], "program": [2, 3, 5, 7, 15, 19, 21, 22, 24, 26, 28, 31, 32, 33], "unintend": [2, 5], "neg": [2, 5, 7, 28], "consequ": [2, 5], "conclus": [2, 5], "recommend": [2, 5], "enabl": [2, 3, 5, 7, 21, 22, 24, 26, 28, 30, 32, 33], "improv": [2, 5, 8], "live": [2, 5, 12, 21, 22, 23, 25, 26, 28, 29], "girl": [2, 5, 28], "global": [2, 5, 28], "issu": [2, 5, 14, 27], "establish": [2, 5, 8, 11, 12, 28], "secretari": [2, 5, 6, 11, 12, 28], "pursuant": [2, 5], "whole": [2, 13, 20, 27], "sentenc": [2, 3, 5, 20, 22, 25, 28], "n": [2, 5, 8, 9, 11, 12, 13, 30], "reassign": [2, 9, 28], "medic": [2, 4, 5, 12, 28, 32], "intervent": [2, 28], "purpos": [2, 5, 8, 11, 12, 14, 27, 28], "chapter": [2, 5, 28], "surgeri": [2, 5, 28], "steril": 2, "individu": [2, 3, 4, 5, 6, 11, 23, 26, 28, 30, 33], "castrat": 2, "vasectomi": 2, "hysterectomi": 2, "oophorectomi": 2, "metoidioplasti": 2, "penectomi": 2, "phalloplasti": 2, "vaginoplasti": 2, "chang": [2, 5, 8, 11, 12, 15, 21, 27, 28, 32], "bodi": [2, 4, 8, 11, 12, 21, 22, 23, 25, 26, 28, 29], "correspond": [2, 5, 28], "discord": 2, "mastectomi": 2, "describ": [2, 3, 4, 20, 26, 27, 33], "paragraph": [2, 6, 26, 28], "administ": [2, 28], "suppli": 2, "public": [2, 4, 27, 28, 30, 32, 33], "accommod": [2, 28], "prohibit": [2, 27, 28, 32], "discrimin": [2, 4, 14, 27, 28], "segreg": 2, "civil": [2, 11, 12, 28], "right": [2, 4, 5, 10, 11, 12, 13, 14, 15, 24, 27, 28, 29, 31, 32, 33], "1964": 2, "42": [2, 6, 9], "c": [2, 4, 11, 12], "2000a": 2, "amend": [2, 9, 11, 12, 28, 30, 32], "subsect": [2, 6, 28], "insert": [2, 12, 21, 22, 29, 30], "nation": [2, 8, 9, 11, 12, 21, 22, 23, 25, 26, 27], "origin": [2, 12, 13, 16, 20, 21, 28], "strike": [2, 6], "stadium": 2, "other": [2, 3, 4, 5, 6, 7, 8, 11, 12, 13, 14, 16, 19, 20, 21, 22, 23, 25, 26, 27, 28, 31, 32], "provid": [2, 15, 27, 28, 29, 30, 32], "exhibit": 2, "entertain": 2, "recreat": 2, "exercis": 2, "amus": 2, "displai": [2, 23, 28, 32], "redesign": 2, "ani": [2, 4, 5, 6, 9, 12, 13, 21, 22, 23, 25, 26, 27, 28, 32], "good": [2, 5, 12, 27, 32], "store": [2, 26, 30], "shop": 2, "center": [2, 19, 27, 28, 32], "onlin": [2, 27, 33], "retail": 2, "salon": 2, "bank": [2, 9, 12], "ga": [2, 28], "station": 2, "food": 2, "shelter": [2, 12, 28], "travel": 2, "agenc": [2, 21, 22, 23, 25, 26, 28], "funer": 2, "parlor": 2, "legal": [2, 5, 19, 28, 31], "bu": 2, "car": 2, "taxi": 2, "airlin": 2, "depot": 2, "transport": 2, "under": [2, 5, 6, 12, 16, 19, 21, 22, 23, 25, 26, 27, 28, 29, 30, 32], "desegreg": 2, "facil": [2, 28], "301": 2, "2000b": 2, "feder": [2, 5, 6, 9, 12, 27, 28, 32], "fund": [2, 28], "601": 2, "2000d": 2, "unlaw": [2, 28], "employ": [2, 28], "703": 2, "2000e": 2, "header": [2, 9, 12, 28], "except": [2, 5, 26, 28], "e": [2, 13, 22, 23], "enterpris": [2, 28], "situat": 2, "bona": 2, "fide": 2, "occup": [2, 28], "qualif": 2, "recogn": [2, 9, 12, 26, 30], "qualifi": 2, "accord": [2, 4, 5, 10, 12, 19, 21, 27, 28, 31], "h": [2, 8, 9, 11, 12, 22, 23], "second": [2, 15, 16, 19, 21, 22, 23, 26, 27, 29, 30, 32], "704": 2, "ve": [2, 15, 21, 22, 23, 27, 32], "lot": [2, 3, 8, 14, 16, 21, 22, 29], "even": [2, 4, 7, 14, 16, 20, 21, 26, 27, 31, 33], "what": [2, 3, 4, 5, 8, 11, 12, 13, 14, 15, 16, 19, 20, 21, 22, 23, 26, 29, 31], "save": [2, 3, 5, 8, 9, 11, 12, 13, 15, 21, 22, 23, 24, 26, 28, 30, 33], "file": [2, 3, 5, 6, 8, 9, 11, 12, 13, 22, 27, 28, 29, 30, 32, 33], "empti": [2, 8, 11, 12, 22, 23, 28, 32], "def": [2, 6, 8, 11, 12], "loop": [2, 9, 11, 12, 19, 30, 32], "append": [2, 6, 11, 12, 21, 22, 23, 25, 26, 27, 28, 30, 32], "f": [2, 3, 5, 6, 8, 11, 12, 30], "call": [2, 3, 6, 7, 8, 11, 12, 13, 14, 15, 16, 20, 22, 23, 24, 26, 27, 28, 30, 32], "open": [2, 5, 6, 8, 11, 12, 14, 16, 19, 22, 27, 28, 29, 32, 33], "txt": [2, 5, 6, 8, 11, 12, 13, 27], "w": [2, 5, 6, 8, 11, 12], "item": [2, 8, 9, 11, 12, 15, 20, 21, 22, 23, 25, 28, 30, 32, 33], "str": [2, 5, 6, 11, 12, 20, 30], "googl": [3, 9, 15, 16, 32], "colab": [3, 9, 32], "nor": [3, 28, 32], "local": [3, 12, 28], "comput": [3, 6, 7, 13, 14, 16, 17, 19, 20, 21, 22, 23, 25, 26, 28, 29, 33], "distribut": [3, 6, 27, 28], "anaconda": 3, "io": [3, 5, 6, 12], "usag": [3, 9, 11, 30], "power": [3, 16, 20, 21, 22, 23, 25, 26, 28, 33], "capabl": [3, 21], "It": [3, 4, 7, 8, 9, 11, 12, 14, 16, 21, 22, 24, 27, 28, 32, 33], "tag": [3, 12, 28, 29, 32], "creator": 3, "annot": [3, 19, 28], "fill": [3, 28], "linguist": [3, 7], "about": [3, 4, 7, 8, 9, 14, 15, 16, 19, 20, 21, 22, 23, 25, 26, 27, 28, 29, 31, 33], "punctuat": [3, 5, 20, 21], "grammat": 3, "claus": 3, "span": [3, 5, 28, 32], "doe": [3, 5, 6, 7, 8, 14, 16, 21, 22, 26, 27, 28, 32], "piec": [3, 8], "statist": [3, 7, 20, 28], "predict": [3, 6, 7, 16, 17], "been": [3, 4, 7, 9, 15, 16, 23, 27, 28], "lexic": 3, "princeton": [3, 16, 17, 19, 27, 33], "wordnet": 3, "root": [3, 27, 28, 30, 32, 33], "lookup": 3, "tabl": [3, 9, 28], "featur": [3, 4, 5, 7, 15, 19, 28], "come": [3, 8, 20, 21, 23, 26, 28, 30, 33], "across": [3, 4, 7, 10, 16, 27, 28, 31], "adject": 3, "prefix": [3, 12], "shorten": 3, "longer": [3, 16, 23], "transgend": [3, 4, 11, 12, 27, 28, 30], "guess": [3, 13, 14, 20], "categor": [3, 7, 24], "particular": [3, 7, 8, 9, 16, 20, 21, 27, 28], "aspect": [3, 4, 5], "surround": [3, 16, 20], "demonstr": [3, 27], "lanugag": [3, 28], "3": [3, 5, 6, 8, 9, 11, 12, 13, 19, 21, 22, 23, 25, 26, 28, 30], "2": [3, 6, 8, 9, 11, 12, 13, 16, 19, 21, 22, 23, 25, 26, 28, 30], "speak": [3, 7, 8, 16, 20, 21], "case": [3, 6, 11, 13, 22, 23, 26, 27, 28, 31, 33], "my": [3, 4, 7, 12, 15, 27, 33], "filipa": [3, 9, 15, 19, 26], "teach": 3, "workshop": [3, 4, 16, 20, 21, 22, 23, 25, 26, 28, 30, 32, 33], "univers": [3, 19, 27, 28, 33], "happen": [3, 13, 19, 21], "goe": [3, 5, 8, 9, 11, 14, 21, 22, 23, 32], "pars": [3, 28, 30, 31], "long": [3, 13, 22, 23, 26], "document": [3, 5, 6, 28, 29], "amen": 3, "count": [3, 9, 11, 21, 28, 30], "print": [3, 6, 9, 12, 21, 22, 23, 25, 28, 30, 32], "lower_": 3, "lemma_": 3, "noun": 3, "verb": 3, "adverb": 3, "preposit": 3, "deriv": 3, "its": [3, 4, 8, 11, 12, 15, 16, 20, 21, 22, 23, 25, 26, 27, 28, 33], "predic": 3, "might": [3, 4, 20, 21, 23, 33], "seem": [3, 21, 26], "excess": 3, "later": [3, 4, 5, 8, 11, 12, 13, 15, 26, 28, 29, 32], "becom": [3, 5, 16, 20, 21, 23, 26], "select": [3, 13, 15, 27, 28, 29, 32], "onli": [3, 4, 6, 9, 11, 13, 16, 21, 22, 26, 27, 28, 32], "pos_": 3, "dep_": 3, "pron": 3, "poss": 3, "nsubj": 3, "aux": 3, "propn": 3, "attr": [3, 6, 28], "punct": 3, "cconj": 3, "cc": 3, "conj": 3, "dobj": 3, "adp": 3, "prep": 3, "compound": 3, "pobj": 3, "do": [3, 4, 5, 7, 8, 9, 10, 11, 14, 15, 16, 20, 21, 22, 23, 24, 26, 27, 28, 29, 32], "someth": [3, 4, 20, 21, 22, 23, 24, 26, 27, 28, 32, 33], "similar": [3, 5, 6, 7, 16, 26], "result": [3, 4, 5, 7, 8, 9, 11, 12, 13, 14, 21, 22, 25, 27, 28, 30, 32, 33], "modul": [3, 13], "displaci": 3, "visual": [3, 7], "relationship": [3, 8, 11, 12, 16], "render": [3, 8, 11, 12, 27, 28], "style": [3, 15, 28, 29, 32], "dep": 3, "option": [3, 12, 13, 27, 28, 29], "compact": 3, "true": [3, 5, 6, 12, 15, 20, 22, 26, 28, 32, 33], "indic": [3, 4, 5, 8, 12, 13, 14, 15, 23, 26, 27, 28, 29, 30], "real": [3, 20, 25, 28], "peopl": [3, 4, 8, 10, 11, 12, 14, 20, 21, 22, 23, 25, 26, 27, 31], "monetari": [3, 27], "valu": [3, 5, 9, 15, 20, 21, 22, 25, 26, 27, 28], "made": [3, 4, 7, 13, 27, 28, 33], "underli": [3, 26], "context": [3, 4, 5, 7, 12, 16, 23], "left": [3, 14, 27, 28, 32], "po": 3, "show": [3, 11, 21, 22, 26, 27, 28, 29], "There": [4, 9, 14, 16, 20, 24, 26, 27], "neutral": 4, "specul": 4, "creativ": [4, 19], "endeavor": 4, "imagin": [4, 21], "impli": [4, 16], "assumpt": [4, 16, 21, 22, 23, 25, 26], "expect": [4, 6], "addition": [4, 27], "itself": [4, 14, 27, 32], "bring": [4, 27, 28], "frame": [4, 6, 9, 11, 30], "perspect": [4, 7], "though": [4, 20, 23, 26, 27], "often": [4, 13, 20, 25, 27, 28, 33], "feel": [4, 20], "backward": [4, 21], "recurs": 4, "progress": [4, 6, 28], "answer": [4, 7, 8, 16, 21, 22, 27], "Being": 4, "cogniz": 4, "implic": [4, 21, 22, 23, 25, 26], "crucial": [4, 21], "part": [4, 7, 11, 12, 14, 19, 21, 22, 25, 27, 28, 29, 32], "critic": [4, 19], "draw": [4, 5], "expertis": 4, "emerg": [4, 28, 32], "past": [4, 10, 13, 15, 21, 30, 31], "sever": [4, 26, 28, 32, 33], "dramat": 4, "increas": [4, 28], "limit": [4, 14, 27, 28, 32], "tracker": [4, 10, 27, 28, 29, 31], "just": [4, 5, 7, 8, 11, 12, 13, 14, 15, 16, 20, 21, 23, 27, 28, 29, 32, 33], "month": [4, 12], "2023": [4, 9, 10, 12, 27, 28, 30, 31, 32], "being": [4, 5, 7, 16, 20, 21, 22, 23, 25, 26, 27, 28, 31], "consid": [4, 14, 20, 27, 33], "countri": [4, 8, 11, 12], "block": [4, 5, 22, 28], "healthcar": [4, 10, 28, 31, 32], "affirm": [4, 13], "bathroom": [4, 10, 28, 31, 32], "ban": 4, "sport": [4, 10, 28, 31, 32], "express": [4, 9, 12, 20, 22, 24, 28], "school": [4, 28, 32], "explos": [4, 10, 31], "codifi": [4, 12], "reflect": [4, 26], "worri": 4, "trend": 4, "gener": [4, 5, 6, 7, 11, 13, 14, 15, 16, 17, 19, 20, 27, 28, 31, 32, 33], "view": [4, 27, 28, 32], "exist": [4, 7, 13, 21, 28], "interest": [4, 14, 16, 28, 32], "themselv": [4, 8, 11, 12, 27, 31, 33], "fact": 4, "cultur": [4, 5, 19, 33], "phenomena": 4, "mixtur": 4, "both": [4, 5, 26, 27, 33], "exacerb": [4, 5, 27], "collect": [4, 6, 7, 15, 20, 21, 22, 23, 24, 27, 28, 33], "goal": [4, 9, 12, 15, 17, 24, 25, 27, 30], "conflat": 4, "phenomenon": 4, "anticip": 4, "drawn": 4, "link": [4, 9, 14, 28, 29, 32, 33], "vocabulari": 4, "homosauru": 4, "variou": [4, 19, 20, 21, 28, 32], "social": [4, 5, 27, 28, 32], "construct": [4, 28, 30], "system": [4, 21, 22, 23, 25, 26, 28], "give": [4, 7, 16, 23, 26, 27, 28, 30, 33], "masculin": [4, 5], "feminin": 4, "interact": [4, 24, 30, 33], "respons": [4, 11, 12, 15, 21, 22, 23, 25, 26, 28], "physiolog": [4, 5], "sens": [4, 5, 11, 12, 15, 16, 20, 26, 28, 29, 32, 33], "self": [4, 6, 12, 13], "contrast": [4, 7, 16, 21, 26], "assign": [4, 8, 21, 22, 23, 26, 28, 30, 32], "reproduct": [4, 5, 15, 28], "usual": [4, 23, 27], "extern": [4, 5, 13, 15, 19], "anatomi": [4, 28], "chromosom": [4, 5, 15], "gene": 4, "hormon": [4, 5, 15], "effect": [4, 8, 11, 12, 27, 28, 30], "ought": 4, "spend": 4, "me": [4, 27], "contextu": [4, 7], "pull": [4, 9, 15, 32, 33], "capac": [4, 5, 15], "occur": [4, 5, 15, 21], "gonad": [4, 5, 15], "non": [4, 5, 9, 11, 14, 27, 30], "ambigu": [4, 5], "genitalia": [4, 5, 15], "present": [4, 5, 15, 27, 28], "birth": [4, 5, 15, 28], "regard": [4, 5, 13, 28], "psycholog": [4, 5], "chosen": [4, 5], "experi": [4, 5, 19], "behavior": [4, 5], "stereotyp": 4, "pregnanc": 4, "childbirth": 4, "condit": [4, 19, 20, 28], "d": [4, 5, 9, 12, 13, 27, 28, 30], "characterist": [4, 5, 27], "intersex": 4, "trait": [4, 14], "manner": [4, 5], "regardless": [4, 5, 25], "homosexu": [4, 5], "heterosexu": [4, 5], "bisexu": [4, 5], "veri": [5, 7, 13, 14, 22, 26, 27], "phrasematch": 5, "two": [5, 8, 9, 11, 16, 20, 23, 27, 28, 32], "same": [5, 9, 13, 14, 21, 22, 23, 25, 26, 27, 28], "defintit": 5, "did": [5, 11, 22], "creat": [5, 12, 13, 14, 15, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 31, 32, 33], "take": [5, 8, 11, 12, 13, 14, 15, 16, 17, 19, 21, 22, 23, 24, 25, 26, 27, 28, 32], "well": [5, 8, 12, 13, 14, 21, 23, 27, 29, 32], "synonym": 5, "That": [5, 14, 20, 21, 23, 28, 30], "where": [5, 7, 14, 15, 20, 21, 23, 24, 25, 26, 27, 28, 29, 32, 33], "last": [5, 6, 8, 10, 12, 13, 21, 23, 28, 31, 32], "ruler": 5, "idea": [5, 7, 8, 20, 23], "kei": [5, 8, 9, 11, 15, 16, 30], "pair": [5, 9, 15], "page": [5, 12, 14, 15, 27, 29, 30, 31, 33], "api": [5, 6, 11, 19, 22, 27, 31, 32], "pattern_format": 5, "lower": [5, 12, 23], "is_punct": 5, "terminolog": 5, "instanc": 5, "specifi": [5, 11, 12, 15, 22, 23, 28], "ent_typ": 5, "op": [5, 6, 30], "wild": [5, 27], "card": [5, 14, 27, 28], "zero": [5, 21], "lowercas": [5, 23], "signifi": [5, 21], "mather": 5, "33": [5, 6, 9, 11, 28, 32], "match_id": 5, "string_id": 5, "represent": [5, 16], "2288": 5, "2292": 5, "9680": 5, "9684": 5, "9785": 5, "9788": 5, "11856": 5, "11861": 5, "transit": [5, 11, 12, 28, 32], "procedur": [5, 28], "surgic": [5, 28], "seek": [5, 21, 22, 23, 25, 26, 28], "alter": [5, 22, 28], "remov": [5, 6, 8, 12, 13, 14, 19, 21, 28], "anatom": 5, "instil": 5, "resembl": 5, "physician": [5, 28], "inpati": 5, "outpati": 5, "hospit": [5, 28], "prescrib": 5, "drug": 5, "puberti": 5, "cross": [5, 32], "mechan": 5, "promot": [5, 25, 28], "femin": 5, "opposit": [5, 16, 28], "Such": 5, "treatment": [5, 28], "verifi": [5, 28], "disord": [5, 28], "aa": 5, "irresolv": 5, "presenc": [5, 28], "46": [5, 6, 9, 28], "xx": 5, "viril": 5, "xy": 5, "underviril": 5, "ovarian": 5, "testicular": 5, "tissu": 5, "bb": 5, "diagnos": 5, "respect": [5, 28], "determin": [5, 8, 11, 12, 27, 28], "genet": [5, 28], "biochem": [5, 28], "test": [5, 12], "normal": [5, 21, 22, 23, 25, 26, 28, 32], "steroid": 5, "action": [5, 8, 9, 11, 12, 20, 23, 26, 27, 28, 32], "infect": 5, "injuri": 5, "diseas": 5, "caus": [5, 14, 21, 28], "whether": [5, 7, 22, 27, 33], "deduct": [5, 28], "expens": 5, "connect": 5, "12143": 5, "12146": 5, "12168": 5, "12172": 5, "hi": [5, 9, 12], "her": 5, "physic": [5, 28], "12232": 5, "12237": 5, "genit": 5, "assist": [5, 8, 9, 11, 12, 28], "12548": 5, "12552": 5, "testosteron": 5, "androgen": 5, "given": [5, 6, 13, 16, 28, 32], "dose": 5, "profoundli": 5, "larger": [5, 7, 14, 21, 28, 31, 32, 33], "potent": 5, "healthi": 5, "estrogen": 5, "12542": 5, "ix": 5, "13845": 5, "13848": 5, "nonambigu": 5, "due": [5, 7, 8, 11, 12, 27], "versatil": [5, 19], "dysphoria": [5, 28], "beyond": 5, "were": [5, 10, 11, 12, 14, 21, 22, 23, 25, 26, 27, 29, 31], "abl": [5, 21, 22, 23, 25, 26, 27, 33], "pretti": [5, 13], "cool": 5, "review": [5, 28], "full": [5, 11, 21, 22, 28, 30, 31], "matcher_def": 5, "folk": 5, "tomotopi": 6, "tp": 6, "bab2min": 6, "github": [6, 14], "v0": 6, "12": [6, 9, 11, 12, 28, 30, 32], "en": [6, 10, 23, 32], "mdl": 6, "ldamodel": 6, "k": [6, 9, 12, 28, 32], "line": [6, 8, 9, 12, 13, 21, 22, 23, 27, 28, 30, 32, 33], "117s_text_clean": 6, "add_doc": 6, "strip": [6, 12], "split": [6, 11, 12, 21, 22, 23, 25, 26, 32], "rang": [6, 21, 30], "iter": [6, 12, 13, 24, 27], "tlog": 6, "likelihood": [6, 14], "ll_per_word": 6, "log": [6, 13, 27], "053539932129096": 6, "858447764373736": 6, "74447290421813": 6, "30": [6, 9, 12], "662153702239387": 6, "40": [6, 9, 16, 28], "596505404571529": 6, "54195286414643": 6, "495335749251728": 6, "454269957649737": 6, "80": [6, 9, 28], "405036907530018": 6, "90": [6, 9, 11, 12, 16], "363642610741756": 6, "top": [6, 13, 14, 15, 28, 29, 32], "topic": [6, 7, 16, 28], "get_topic_word": 6, "top_n": 6, "05388536676764488": 6, "04434826970100403": 6, "040047500282526016": 6, "02720104530453682": 6, "02327030897140503": 6, "02238362468779087": 6, "011680571362376213": 6, "011045229621231556": 6, "010968430899083614": 6, "010507633909583092": 6, "1": [6, 8, 9, 11, 12, 13, 15, 19, 20, 21, 22, 23, 25, 26, 28, 30], "07137387245893478": 6, "028800904750823975": 6, "023578671738505363": 6, "013782079331576824": 6, "013222554698586464": 6, "011730488389730453": 6, "010002831928431988": 6, "009207718074321747": 6, "008196646347641945": 6, "00805921945720911": 6, "05497410148382187": 6, "039837151765823364": 6, "012913113459944725": 6, "01231541857123375": 6, "009952441789209843": 6, "007923061959445477": 6, "006477476097643375": 6, "006199478637427092": 6, "005546185187995434": 6, "child": [6, 12, 16, 28, 32], "00543498620390892": 6, "06894353032112122": 6, "0499117486178875": 6, "044039785861968994": 6, "03318462148308754": 6, "028740808367729187": 6, "026730364188551903": 6, "02236623503267765": 6, "01437962893396616": 6, "012608232907950878": 6, "011180083267390728": 6, "4": [6, 8, 9, 11, 12, 13, 19, 21, 22, 23, 25, 26, 28, 30, 32], "058097559958696365": 6, "048920921981334686": 6, "0377509742975235": 6, "031786952167749405": 6, "027100559324026108": 6, "020797254517674446": 6, "019758189097046852": 6, "018448755145072937": 6, "018130674958229065": 6, "016672803089022636": 6, "06665465980768204": 6, "05515214800834656": 6, "02065461315214634": 6, "01204273197799921": 6, "011262561194598675": 6, "01082246471196413": 6, "010062298737466335": 6, "009622202254831791": 6, "008021852932870388": 6, "007781800348311663": 6, "07194483280181885": 6, "054774586111307144": 6, "047234587371349335": 6, "034164249897003174": 6, "02700704336166382": 6, "025712601840496063": 6, "016727060079574585": 6, "015860741958022118": 6, "shall": [6, 9, 11, 12, 28, 32], "01526136975735426": 6, "0149390185251832": 6, "08475305140018463": 6, "047203872352838516": 6, "031947240233421326": 6, "02246880903840065": 6, "02050628699362278": 6, "01811237446963787": 6, "017383264377713203": 6, "016569091007113457": 6, "01433923002332449": 6, "01331239938735962": 6, "07536368817090988": 6, "041805367916822433": 6, "030558869242668152": 6, "025009434670209885": 6, "018768835812807083": 6, "018648050725460052": 6, "015514330938458443": 6, "013850171118974686": 6, "013709253631532192": 6, "011749840341508389": 6, "05619411543011665": 6, "04916512221097946": 6, "04034888371825218": 6, "02283008210361004": 6, "02161121740937233": 6, "021573325619101524": 6, "0160537026822567": 6, "012877077795565128": 6, "012277118861675262": 6, "012270803563296795": 6, "05778033658862114": 6, "041525308042764664": 6, "02643531747162342": 6, "012538100592792034": 6, "010799792595207691": 6, "010013855993747711": 6, "009791944175958633": 6, "008811834268271923": 6, "008349518291652203": 6, "007609813008457422": 6, "045426853001117706": 6, "04368209466338158": 6, "029611913487315178": 6, "019493717700242996": 6, "017552761361002922": 6, "016978181898593903": 6, "015408600680530071": 6, "014301484450697899": 6, "01277394499629736": 6, "011526688002049923": 6, "053602177649736404": 6, "04851926490664482": 6, "04832858592271805": 6, "03757983446121216": 6, "01673062890768051": 6, "01606598310172558": 6, "015542982146143913": 6, "015210658311843872": 6, "01467131357640028": 6, "013717927038669586": 6, "08932202309370041": 6, "058066677302122116": 6, "011682633310556412": 6, "011030647903680801": 6, "00834287516772747": 6, "0073449392803013325": 6, "007331633474677801": 6, "006852624472230673": 6, "amount": [6, 12, 16, 28], "006812707055360079": 6, "006786095444113016": 6, "14": [6, 8, 9, 11, 12, 28], "07768867164850235": 6, "04232051223516464": 6, "04065348953008652": 6, "032444097101688385": 6, "02342032454907894": 6, "02188994735479355": 6, "018238898366689682": 6, "016265802085399628": 6, "016036245971918106": 6, "015194537118077278": 6, "15": [6, 9, 11, 12, 28], "07483828812837601": 6, "047694746404886246": 6, "01961832493543625": 6, "019424837082624435": 6, "01831919327378273": 6, "014988443814218044": 6, "01482950709760189": 6, "014262865297496319": 6, "013108850456774235": 6, "012652772478759289": 6, "16": [6, 9, 11, 12, 28, 32], "05961429700255394": 6, "037866175174713135": 6, "02345755696296692": 6, "017499033361673355": 6, "010227124206721783": 6, "00961871724575758": 6, "009193798527121544": 6, "008730250410735607": 6, "008421218954026699": 6, "007919041439890862": 6, "17": [6, 9, 11, 12, 28], "05169806629419327": 6, "03995613008737564": 6, "026608508080244064": 6, "024469666182994843": 6, "023992301896214485": 6, "017650166526436806": 6, "01498436275869608": 6, "014606190845370293": 6, "014240417629480362": 6, "013949038460850716": 6, "07110285758972168": 6, "03637167066335678": 6, "015320097096264362": 6, "01122890505939722": 6, "0109945647418499": 6, "009744750335812569": 6, "00914913509041071": 6, "009051493369042873": 6, "008094603195786476": 6, "00799696147441864": 6, "19": [6, 9, 12, 28], "07225526869297028": 6, "04751206561923027": 6, "032853610813617706": 6, "03239491209387779": 6, "02474326826632023": 6, "01903943531215191": 6, "01371452771127224": 6, "013621458783745766": 6, "013156110420823097": 6, "012052572332322598": 6, "summari": [6, 9, 11, 12, 28, 30], "info": [6, 11, 30], "2767674": 6, "132815": 6, "entropi": 6, "53844": 6, "weight": [6, 28, 32], "na": 6, "burn": 6, "optim": 6, "interv": 6, "per": 6, "36364": 6, "initi": [6, 19, 27, 28], "paramet": [6, 8, 12, 13, 14, 15, 30, 33], "tw": 6, "termweight": 6, "ONE": 6, "min_cf": 6, "minimum": 6, "frequenc": 6, "min_df": 6, "rm_top": 6, "32767": 6, "alpha": 6, "hyperparamet": [6, 13], "dirichlet": 6, "float": [6, 20], "symmetr": 6, "prior": 6, "length": [6, 9, 11, 13, 15], "asymmetr": 6, "eta": 6, "01": [6, 28, 30], "seed": 6, "1119695798": 6, "random": 6, "8569565": 6, "7062378": 6, "813477": 6, "417408": 6, "1705065": 6, "6227145": 6, "5072103": 6, "4796157": 6, "085812": 6, "321555": 6, "9014735": 6, "9331636": 6, "0490155": 6, "9188871": 6, "018366": 6, "9497604": 6, "733492": 6, "393309": 6, "7279112": 6, "1359215": 6, "141902": 6, "100544": 6, "70615": 6, "161820": 6, "187303": 6, "98650": 6, "197213": 6, "163256": 6, "147696": 6, "157016": 6, "106823": 6, "141385": 6, "182228": 6, "73827": 6, "181633": 6, "143384": 6, "102221": 6, "159974": 6, "101087": 6, "149097": 6, "spacy_clean": 6, "cleaner": [6, 8, 9, 13], "remove_stopword_token": 6, "r": [6, 8, 9, 11, 12, 13], "20706436": 6, "00": [6, 13], "257": [6, 11, 12], "07": [6, 28, 30], "35": [6, 9, 16, 28], "1839": 6, "59it": 6, "769": 6, "55": [6, 9], "54": [6, 9], "2977": 6, "43it": 6, "1281": 6, "43": [6, 9, 28], "3323": 6, "05it": 6, "1793": 6, "39": [6, 9, 28], "03": [6, 28, 30], "3483": 6, "77it": 6, "2305": 6, "47": [6, 9, 28], "3602": 6, "41it": 6, "2666": 6, "37": [6, 9, 28], "23": [6, 9, 12, 28], "3543": 6, "00it": 6, "3073": 6, "31": [6, 9, 11, 28, 30], "3365": 6, "34it": 6, "3585": 6, "3523": 6, "37it": 6, "4097": 6, "34": [6, 9, 15, 26, 28], "3643": 6, "11it": 6, "4609": 6, "3689": 6, "23it": 6, "5121": 6, "56": [6, 9, 28, 30], "3752": 6, "39it": 6, "5633": 6, "32": [6, 9, 12, 28], "3739": 6, "90it": 6, "6145": 6, "3778": 6, "06it": 6, "6657": 6, "3806": 6, "02it": 6, "7169": 6, "45": [6, 9], "3800": 6, "87it": 6, "7681": 6, "02": [6, 28, 30], "3809": 6, "66it": 6, "8193": 6, "21": [6, 9, 12, 28, 30], "3817": 6, "80it": 6, "8705": 6, "3820": 6, "33it": 6, "9217": 6, "3827": 6, "9729": 6, "3793": 6, "42it": 6, "10241": 6, "52": [6, 9, 28, 32], "3796": 6, "10753": 6, "3799": 6, "89it": 6, "11265": 6, "3802": 6, "71it": 6, "11777": 6, "29": [6, 9, 13, 28], "3811": 6, "36it": 6, "12289": 6, "12801": 6, "3805": 6, "55it": 6, "13313": 6, "84it": 6, "13825": 6, "15it": 6, "14337": 6, "3782": 6, "10it": 6, "14849": 6, "04": [6, 28, 30], "57": [6, 9, 30], "3791": 6, "12it": 6, "15361": 6, "57it": 6, "15873": 6, "22": [6, 9, 28, 30], "3815": 6, "16385": 6, "3818": 6, "38it": 6, "16897": 6, "26": [6, 9, 10, 28, 31], "3812": 6, "50it": 6, "17409": 6, "3816": 6, "17921": 6, "29it": 6, "18433": 6, "3787": 6, "18945": 6, "05": [6, 28, 30], "3792": 6, "22it": 6, "19457": 6, "49": [6, 9, 28, 30], "46it": 6, "19969": 6, "03it": 6, "20481": 6, "36": [6, 9, 28, 30], "3804": 6, "20993": 6, "96it": 6, "21505": 6, "78it": 6, "21886": 6, "41": [6, 9, 28], "3801": 6, "22273": 6, "3490": 6, "22785": 6, "06": [6, 28, 30], "3588": 6, "26it": 6, "23297": 6, "3656": 6, "23809": 6, "3705": 6, "24321": 6, "3738": 6, "35it": 6, "24833": 6, "3761": 6, "25345": 6, "3772": 6, "25857": 6, "3771": 6, "26369": 6, "3764": 6, "26881": 6, "3785": 6, "27393": 6, "3786": 6, "24it": 6, "27905": 6, "88it": 6, "28417": 6, "3807": 6, "30it": 6, "28929": 6, "27": [6, 9, 28], "65it": 6, "29441": 6, "29953": 6, "08": [6, 28], "3788": 6, "85it": 6, "30465": 6, "53": [6, 9], "30977": 6, "3803": 6, "08it": 6, "31489": 6, "70it": 6, "32001": 6, "91it": 6, "32513": 6, "3837": 6, "32it": 6, "33025": 6, "3826": 6, "33537": 6, "3830": 6, "47it": 6, "34049": 6, "09": [6, 30], "3824": 6, "56it": 6, "34561": 6, "3814": 6, "16it": 6, "35073": 6, "63it": 6, "35585": 6, "3794": 6, "94it": 6, "36097": 6, "21it": 6, "36609": 6, "67it": 6, "37121": 6, "37633": 6, "38145": 6, "3780": 6, "38657": 6, "39169": 6, "3784": 6, "39681": 6, "3534": 6, "17it": 6, "40193": 6, "3615": 6, "49it": 6, "40705": 6, "44": [6, 9, 28], "3673": 6, "41217": 6, "3717": 6, "41729": 6, "58": [6, 9], "3744": 6, "44it": 6, "42241": 6, "3762": 6, "42753": 6, "43265": 6, "3776": 6, "43777": 6, "44289": 6, "74it": 6, "44801": 6, "93it": 6, "45313": 6, "3813": 6, "76it": 6, "45825": 6, "3810": 6, "81it": 6, "46337": 6, "3797": 6, "46849": 6, "24": [6, 9, 28, 30], "3808": 6, "47361": 6, "47873": 6, "3821": 6, "48385": 6, "48897": 6, "51": [6, 9, 28], "3831": 6, "53it": 6, "49409": 6, "3853": 6, "49921": 6, "3863": 6, "50433": 6, "3828": 6, "31it": 6, "50945": 6, "51457": 6, "18it": 6, "51969": 6, "52481": 6, "52993": 6, "59": [6, 9, 28], "53505": 6, "3845": 6, "54017": 6, "69it": 6, "54529": 6, "55041": 6, "55553": 6, "56065": 6, "98it": 6, "56577": 6, "3835": 6, "13it": 6, "57089": 6, "3825": 6, "58it": 6, "57601": 6, "58113": 6, "58625": 6, "64it": 6, "59137": 6, "59649": 6, "83it": 6, "60161": 6, "60673": 6, "61185": 6, "61697": 6, "3819": 6, "62209": 6, "82it": 6, "62721": 6, "63233": 6, "63745": 6, "25": [6, 9, 16, 28], "64257": 6, "64769": 6, "65281": 6, "65793": 6, "3559": 6, "79it": 6, "66305": 6, "3616": 6, "66817": 6, "3644": 6, "67329": 6, "3684": 6, "67841": 6, "3735": 6, "68353": 6, "3747": 6, "68865": 6, "3769": 6, "69377": 6, "97it": 6, "69889": 6, "70401": 6, "3790": 6, "70913": 6, "71425": 6, "3777": 6, "71937": 6, "72449": 6, "3798": 6, "72961": 6, "62it": 6, "73473": 6, "73985": 6, "14it": 6, "74497": 6, "3822": 6, "01it": 6, "75009": 6, "75521": 6, "76033": 6, "76545": 6, "77057": 6, "77569": 6, "78081": 6, "60it": 6, "78593": 6, "79105": 6, "79617": 6, "80129": 6, "04it": 6, "80641": 6, "81153": 6, "68it": 6, "81665": 6, "25it": 6, "82177": 6, "82689": 6, "83201": 6, "51it": 6, "83713": 6, "84225": 6, "84737": 6, "85249": 6, "85761": 6, "3823": 6, "86273": 6, "86785": 6, "87297": 6, "87809": 6, "95it": 6, "88188": 6, "3767": 6, "88577": 6, "3484": 6, "52it": 6, "89089": 6, "3580": 6, "89601": 6, "3642": 6, "90113": 6, "3605": 6, "90625": 6, "3663": 6, "73it": 6, "91137": 6, "3709": 6, "91649": 6, "3723": 6, "92161": 6, "3755": 6, "54it": 6, "92673": 6, "3765": 6, "92it": 6, "93185": 6, "93697": 6, "94209": 6, "94721": 6, "45it": 6, "95233": 6, "95745": 6, "96257": 6, "3773": 6, "96769": 6, "97281": 6, "97793": 6, "98305": 6, "3832": 6, "98817": 6, "27it": 6, "99329": 6, "99841": 6, "100353": 6, "100865": 6, "101377": 6, "101889": 6, "99it": 6, "102401": 6, "102913": 6, "103425": 6, "103937": 6, "104449": 6, "104961": 6, "105473": 6, "105985": 6, "106497": 6, "3833": 6, "107009": 6, "107391": 6, "107777": 6, "3498": 6, "72it": 6, "108289": 6, "108801": 6, "109313": 6, "3704": 6, "109825": 6, "3743": 6, "110337": 6, "110849": 6, "111361": 6, "111873": 6, "112385": 6, "112897": 6, "113152": 6, "keyboardinterrupt": [6, 13], "traceback": [6, 12, 13, 23, 32], "recent": [6, 7, 12, 13, 23, 28, 31, 32], "cell": [6, 12, 13, 15, 23, 24, 28, 30, 32], "95": [6, 9], "as_tupl": 6, "batch_siz": [6, 13], "disabl": [6, 15, 21, 22, 23, 25, 26, 28, 32], "component_cfg": 6, "n_process": 6, "62": [6, 9], "noqa": 6, "plr0913": 6, "63": [6, 9, 28], "64": [6, 9, 12, 13, 28], "union": 6, "73": [6, 9, 28], "int": [6, 20], "74": [6, 9], "75": [6, 9, 28], "stream": 6, "76": [6, 9], "77": [6, 9], "arg": [6, 12, 13], "93": [6, 9], "94": [6, 9], "return": [6, 8, 11, 12, 13, 21, 33], "96": [6, 9, 28], "helper": 6, "clean_doc": 6, "processor": [6, 12], "97": [6, 9], "tqdm": 6, "98": [6, 9], "ignor": [6, 13, 28, 30], "overload": [6, 11, 30], "99": [6, 9, 16, 30], "102": [6, 9], "103": [6, 9], "104": [6, 9], "105": [6, 9], "106": [6, 9], "desc": 6, "107": [6, 9], "108": [6, 9], "109": [6, 9], "listcomp": 6, "std": 6, "1181": 6, "__iter__": 6, "1178": 6, "_time": 6, "1180": 6, "obj": 6, "1182": 6, "yield": 6, "1183": 6, "progressbar": 6, "1184": 6, "speed": 6, "optimis": 6, "1618": 6, "1616": 6, "1617": 6, "1619": 6, "1685": 6, "_pipe": 6, "proc": 6, "default_error_handl": 6, "kwarg": [6, 12, 13], "1675": 6, "1676": 6, "1677": 6, "pipecal": 6, "1682": 6, "map": [6, 27], "1683": 6, "1684": 6, "hasattr": 6, "1686": 6, "els": [6, 12, 13, 22, 27, 30], "1687": 6, "__call__": 6, "doesn": [6, 9, 11, 12, 20, 27], "t": [6, 8, 9, 11, 12, 13, 14, 20, 21, 23, 27, 32], "1688": 6, "dict": [6, 9, 12, 15, 20], "transition_pars": 6, "pyx": 6, "251": 6, "264": [6, 12], "285": [6, 9], "greedy_pars": 6, "thinc": 6, "334": 6, "x": [6, 8, 13, 22, 23, 26, 28], "330": [6, 12], "outt": 6, "331": [6, 12], "forward": [6, 13, 26], "is_train": 6, "fals": [6, 12, 15, 20, 21, 22, 23, 25, 26, 28], "332": [6, 15], "output": [6, 13, 15, 21, 22, 23, 26], "instead": [6, 12, 21], "callback": 6, "tupl": [6, 20], "333": 6, "_func": 6, "ml": [6, 14, 16, 17], "tb_framework": 6, "step_model": 6, "parserstepmodel": 6, "layer": [6, 13, 28], "unseen_class": 6, "has_upp": 6, "finish_step": 6, "parser_model": 6, "250": 6, "__init__": [6, 12], "310": 6, "307": 6, "bool": [6, 20, 22], "callabl": 6, "308": 6, "309": 6, "gradient": [6, 13], "via": [6, 33], "backpropag": 6, "chain": [6, 12], "y": [6, 8, 23, 26, 28], "inc_layer_grad": 6, "with_arrai": 6, "xseq": 6, "cast": 6, "seqt": 6, "_list_forward": 6, "xs": [6, 28], "numpy_op": 6, "asarray1i": 6, "seq": 6, "xf": 6, "flatten": 6, "pad": [6, 13, 28, 32], "yf": 6, "get_dxf": 6, "79": [6, 9], "backprop": 6, "dy": 6, "listxd": 6, "dyf": 6, "residu": 6, "d_output": 6, "dx": 6, "backprop_lay": 6, "isinst": 6, "skip": [6, 13, 30], "maxout": 6, "get_param": 6, "reshape2f": 6, "nO": 6, "np": 6, "ni": 6, "gemm": 6, "trans2": 6, "reshape1f": 6, "z": [6, 28], "reshape3f": 6, "shape": [6, 13, 16, 21, 22, 23, 25, 26], "ask": [7, 16, 27, 28], "method": [7, 8, 10, 11, 12, 13, 15, 16, 19, 20, 22, 24, 28, 30, 31, 32, 33], "simpl": [7, 20], "frequent": 7, "complic": [7, 8, 16, 21, 24, 27], "machin": [7, 14, 17, 19], "learn": [7, 8, 13, 14, 15, 19, 20, 21, 28, 32], "distinguish": [7, 20, 28, 33], "network": [7, 16], "graph": [7, 16], "focu": [7, 16, 28, 29, 32], "studi": [7, 27], "central": 7, "nuanc": 7, "necessarili": 7, "summar": 7, "sentiment": [7, 16], "analyz": [7, 10, 19, 22, 27, 30, 31], "while": [7, 19, 20, 21, 23, 25, 27], "approach": [7, 19, 25, 31], "decad": 7, "adop": 7, "probablist": 7, "algorithm": [7, 20], "autom": [7, 14, 33], "score": 7, "hard": [7, 11], "criteria": [7, 28, 32], "explicit": [7, 28], "directli": [7, 8, 11, 12, 14, 27, 28, 32, 33], "pre": [7, 8, 11, 12, 24, 28, 33], "tend": [7, 14, 16, 21], "todai": [7, 16], "combin": [7, 15, 23, 28], "speech": [7, 14, 16, 28, 32], "research": [7, 11, 14, 19, 27, 28, 30], "chart": 7, "voyant": 7, "favorit": [7, 33], "graphic": [7, 16], "Or": [7, 28, 32], "cyclic": 7, "feed": [7, 27, 28], "anoth": [7, 11, 15, 16, 19, 22, 27, 28], "circl": [7, 21], "back": [7, 12, 13, 14, 15, 21, 22, 23, 25, 26, 27], "jump": [7, 24], "discuss": [7, 9, 26, 27, 28], "briefli": [7, 23], "don": [8, 11, 12, 13, 21, 32], "either": [8, 13, 15], "keep": [8, 12, 13, 23, 27, 28], "funtion": 8, "cours": [8, 27, 28], "websit": [8, 11, 14, 15, 16, 19, 27, 28, 29, 30, 31, 32, 33], "transgender_text": 8, "html": [8, 11, 12, 27, 28, 30, 31, 32, 33], "altern": [8, 11, 12, 28], "uncom": 8, "bottom": [8, 28, 29, 32], "space": [8, 9, 11, 14, 15, 16, 22, 28, 32], "notic": [8, 9, 14, 21, 22, 23, 26, 28, 30], "loaded_text": 8, "1000": [8, 12, 28], "1112": [8, 9, 11, 12], "ih": [8, 11, 12], "n117th": [8, 11, 12], "1st": [8, 11, 12, 30], "report": [8, 11, 12, 28, 32], "militari": [8, 9, 11, 12], "coup": [8, 11, 12], "burma": [8, 11, 12], "n_______________________________________________________________________": [8, 11, 12], "februari": [8, 11, 12], "2021": [8, 11, 12], "mr": [8, 9, 11, 12], "connolli": [8, 11, 12], "himself": [8, 11, 12], "price": [8, 11, 12], "north": [8, 11, 12, 28], "carolina": [8, 11, 12, 28], "buchanan": [8, 11, 12], "foreign": [8, 11, 12], "affair": [8, 11, 12], "3000": [8, 12], "4000": 8, "burmes": [8, 11, 12], "threaten": [8, 11, 12, 28], "democrat": [8, 9, 11, 12], "trajectori": [8, 11, 12], "parliament": [8, 11, 12, 16], "therebi": [8, 11, 12, 21, 22, 23, 25, 26], "duli": [8, 11, 12], "elect": [8, 11, 12], "who": [8, 11, 12, 21, 22, 23, 25, 26, 27, 28, 29, 32, 33], "upon": [8, 11, 12, 29], "serv": [8, 11, 12, 33], "commun": [8, 11, 12, 21, 22, 23, 25, 26, 27], "conven": [8, 11, 12, 30], "should": [8, 11, 12, 20, 22, 25, 27, 28, 29, 32, 33], "laud": [8, 11, 12], "complet": [8, 11, 12], "imposs": [8, 11, 12], "nullifi": [8, 11, 12], "collabor": [8, 11, 12, 14, 24], "support": [8, 9, 11, 12, 28, 30, 32, 33], "strengthen": [8, 11, 12], "institut": [8, 11, 12, 19, 28, 32, 33], "partnership": [8, 11, 12], "hdp": [8, 11, 12], "nsec": [8, 11, 12], "statement": [8, 11, 12, 19, 20], "engag": [8, 11, 12, 16, 21, 22, 23, 25, 26, 28, 32], "associ": [8, 11, 12, 20, 21, 22, 23, 25, 26, 27, 28], "southeast": [8, 11, 12], "asian": [8, 11, 12], "asean": [8, 11, 12], "condem": 8, "larg": [8, 14, 20, 21, 22, 33], "blank": [8, 27], "_": [8, 12], "best": [8, 21, 33], "put": [8, 11, 12, 14, 20, 21, 22, 30, 33], "to_take_out": 8, "noth": [8, 21, 27], "overwrit": 8, "variabl": [8, 11, 15, 19, 21, 22, 24, 28, 30, 32], "officeh": [8, 12], "congress1st": [8, 12], "sessionh": [8, 12], "2021mr": [8, 12], "billto": [8, 12], "cite": [8, 11, 12], "protect": [8, 11, 12, 27, 28, 32], "democraci": [8, 11, 12], "On": [8, 11, 12, 14, 15, 27, 29], "march": [8, 11, 12, 30], "2005": [8, 11, 12], "agre": [8, 11, 12], "135": [8, 9, 11, 12], "commiss": [8, 11, 12, 28], "hereaft": [8, 11, 12], "di": 8, "sai": [8, 15, 22, 23, 26, 28, 29], "compon": [8, 16, 30], "parenthes": [8, 20, 21, 22, 23, 26], "moment": [8, 21, 27], "whatev": [8, 23, 28], "execut": [8, 20, 22, 23, 24, 28], "10021": 8, "10026": 8, "input": [8, 11, 13, 14, 15, 16, 20, 28], "insid": [8, 13, 15, 23, 28], "known": [8, 16], "formal": 8, "portabl": 8, "clean_up": [8, 12], "And": [8, 9, 26, 27, 28, 32], "clean_sampl": 8, "panda": [9, 10, 11, 12, 19, 30, 31, 32], "tabular": [9, 10, 11, 12, 30, 32], "spreadsheet": [9, 10, 11, 12, 28, 30, 32, 33], "pd": [9, 11, 12, 30, 32], "dimension": 9, "hold": [9, 11, 12, 32], "dictionari": 9, "csv": [9, 11, 12, 13, 15, 30], "gov": [9, 11, 12, 27, 30, 31], "upload": [9, 28], "congress_csv": [9, 12], "df": [9, 11, 12, 30, 32], "read_csv": [9, 11, 12], "transgender_raw_data": 9, "legisl": [9, 11, 12, 28, 29, 30, 32], "url": [9, 11, 12, 27, 28, 30, 32], "sponsor": [9, 11, 12, 28, 30], "parti": [9, 11, 12, 28], "introduct": [9, 11, 12, 19], "latest": [9, 11, 12], "211": [9, 12], "212": [9, 12], "213": [9, 12], "submit": [9, 11, 12, 28], "propos": [9, 10, 11, 12, 31], "www": [9, 11, 12, 27], "118th": [9, 12], "2024": [9, 12, 28, 29, 30], "readi": [9, 12], "jim": [9, 12], "rep": [9, 12], "republican": [9, 12], "arm": [9, 12], "servi": [9, 12], "nan": [9, 12, 13], "p": [9, 12, 19, 28, 29, 32], "435": [9, 11, 12], "rubio": [9, 12], "marco": [9, 12], "sen": [9, 12], "fl": [9, 12, 28], "886": [9, 11, 12], "principl": [9, 12, 28, 30, 31], "transg": [9, 12, 30], "jayap": [9, 12], "pramila": [9, 12], "judiciari": [9, 12, 30], "resolut": [9, 12, 28, 30], "464": [9, 11, 12], "hirono": [9, 12], "mazi": [9, 12], "star": [9, 12], "269": [9, 11, 12], "duti": [9, 12, 28], "workforc": [9, 12], "introductori": [9, 12, 19], "remark": [9, 12], "measur": [9, 12], "cr": [9, 12], "impl": [9, 12], "281": 9, "chair": 9, "yie": 9, "282": [9, 12], "biotechnolog": 9, "equip": 9, "produc": [9, 21, 22, 23, 25, 26], "283": 9, "provi": 9, "284": 9, "director": 9, "intellig": [9, 16], "submi": 9, "demand": [9, 21, 22, 23, 25, 26], "record": [9, 28], "vote": [9, 11, 12], "286": 9, "650": [9, 12], "da": 9, "gama": 9, "calado": [9, 15, 19], "ag": [9, 15, 26, 28], "degre": [9, 15], "literatur": [9, 15, 27], "job": [9, 15], "digit": [9, 26], "scholarship": 9, "specialist": 9, "index": [9, 15, 30], "core": [9, 11, 19, 28, 30], "rangeindex": [9, 11], "dtype": [9, 11, 12, 13, 30], "float64": [9, 11], "646": 9, "mb": 9, "miss": 9, "still": [9, 16, 20], "isol": [9, 23, 29], "148": [9, 11], "280": [9, 12], "int64index": [9, 30], "752": 9, "kb": [9, 11, 30], "arrai": 9, "cosponsor": 9, "48": [9, 28], "61": [9, 11], "65": 9, "66": [9, 12, 28], "67": 9, "68": [9, 28], "69": 9, "71": [9, 28], "78": 9, "81": 9, "82": 9, "83": [9, 28, 31], "84": 9, "85": [9, 16, 28], "86": 9, "87": [9, 10, 28, 31], "88": 9, "89": 9, "91": 9, "92": [9, 28], "110": 9, "111": 9, "112": 9, "113": 9, "114": [9, 11], "115": [9, 11], "116": 9, "117": [9, 11, 12, 28], "118": [9, 12, 13, 15, 30], "119": 9, "120": 9, "121": 9, "122": 9, "123": 9, "124": 9, "125": [9, 14], "126": [9, 13], "127": 9, "128": 9, "129": 9, "130": 9, "131": 9, "132": 9, "133": [9, 28], "134": 9, "136": 9, "137": 9, "138": 9, "139": 9, "140": 9, "141": 9, "142": 9, "143": [9, 11], "144": [9, 11, 12], "145": [9, 11], "146": [9, 11, 28], "147": [9, 11, 12], "149": [9, 12], "150": 9, "151": 9, "152": 9, "153": [9, 28], "154": [9, 12], "155": 9, "156": [9, 28], "157": 9, "158": [9, 28], "159": 9, "160": 9, "161": 9, "162": 9, "163": 9, "164": 9, "165": 9, "166": 9, "167": 9, "168": 9, "169": 9, "170": 9, "171": 9, "172": 9, "173": 9, "174": [9, 10, 31], "175": 9, "176": 9, "177": 9, "178": 9, "179": 9, "180": 9, "181": 9, "182": 9, "183": 9, "184": 9, "185": 9, "186": 9, "187": 9, "188": 9, "189": 9, "190": 9, "191": 9, "192": 9, "193": [9, 11, 12], "194": 9, "195": [9, 11, 12], "196": 9, "197": 9, "198": 9, "199": 9, "200": [9, 12, 28, 32], "205": 9, "206": 9, "207": 9, "208": 9, "209": [9, 12], "210": [9, 12], "214": [9, 12], "axi": 9, "down": [9, 14, 27, 28, 32], "400": [9, 28], "rest": [9, 13, 15, 21, 22, 23, 25, 26, 28], "434": 9, "431": 9, "503": 9, "ellips": 9, "anymor": 9, "rid": [9, 28], "mostli": [9, 27, 33], "232": 9, "229": 9, "null": [9, 11, 30], "workspac": 9, "to_csv": [9, 30, 32], "congress_clean": [9, 11], "legis": [10, 31], "transform": [10, 13, 14, 15, 16, 17, 19, 20, 26, 28, 33], "raw": [10, 30], "messi": [10, 30], "manipul": [10, 15, 20, 28, 33], "primarili": [10, 13, 17, 31], "built": 10, "libari": 10, "oop": 10, "mass": [10, 23], "coupl": [10, 21, 27, 31], "restrict": [10, 28, 31, 32, 33], "plai": [10, 15, 16, 29, 31], "Of": [10, 28, 31, 32], "legislatur": [10, 27, 28, 31], "compar": [10, 31], "2022": [10, 31], "share": [11, 27], "done": [11, 23, 26, 32, 33], "replic": 11, "reason": [11, 27, 28], "fyi": 11, "tri": [11, 27], "alwai": [11, 21, 22, 23, 25, 26, 33], "turn": [11, 12, 30], "futur": [11, 21, 22], "ll": [11, 14, 15, 16, 20, 21, 27, 28, 32], "wrote": 11, "relev": [11, 12, 30, 32], "regular": [11, 13, 20, 28], "side": [11, 14], "abil": [11, 28], "super": [11, 13, 14, 21], "won": 11, "notebook": 11, "grab": [11, 12, 21, 28], "found": [11, 12, 13, 15, 28], "sure": [11, 12, 13, 14, 26, 27], "datafram": [11, 30, 32], "column": [11, 12, 28, 30, 32], "unnam": 11, "int64": [11, 30], "amdt": [11, 12], "256": [11, 12], "255": [11, 12, 28], "isnumer": [11, 12], "row": [11, 12, 15, 28, 30], "scrape_bill_text": [11, 12], "bills_text": [11, 12], "hr": [11, 12, 28], "117hr": [11, 12], "htm": [11, 12], "enough": [11, 20, 26], "nunit": [11, 12], "nsection": [11, 12], "n2021": [11, 12], "independ": [11, 12], "approv": [11, 12, 28], "2016": [11, 12], "deleg": [11, 12], "meet": [11, 12, 22, 28, 32], "civilian": [11, 12], "led": [11, 12], "counselor": [11, 12], "aung": [11, 12], "san": [11, 12, 28], "suu": [11, 12], "kyi": [11, 12], "societi": [11, 12, 16], "leader": [11, 12], "depart": [11, 12, 28, 33], "assess": [11, 12, 27], "daw": [11, 12], "presid": [11, 12], "win": [11, 12], "myint": [11, 12], "head": [11, 12, 13, 28, 29, 32], "depos": [11, 12], "As": [11, 12, 19, 20, 26, 27, 28, 32], "declar": [11, 12, 21, 27, 28, 32], "martial": [11, 12], "suspend": [11, 12, 28], "detain": [11, 12], "newli": [11, 12], "capitol": [11, 12], "naypyidaw": [11, 12], "usurp": [11, 12], "seizur": [11, 12], "detent": [11, 12], "counsellor": [11, 12], "inabl": [11, 12], "begin": [11, 12, 19, 21, 25, 27, 28, 31, 32], "offici": [11, 12, 22, 26, 28], "mandat": [11, 12], "condemn": [11, 12], "urg": [11, 12, 28], "uncondit": [11, 12], "releas": [11, 12, 16], "appropri": [11, 12, 28, 30, 31, 33], "voic": [11, 12], "Not": [11, 12, 26, 28], "dai": [11, 12, 30, 33], "nthe": [11, 12], "nand": [11, 12], "nof": [11, 12], "ndescript": [11, 12], "effort": [11, 12], "implement": [11, 12, 28], "eventu": [11, 23, 30], "congress_dirty_csv": 12, "httperror": 12, "_decor": 12, "deprecate_kwarg": 12, "_deprecate_kwarg": 12, "wrapper": 12, "new_arg_nam": 12, "new_arg_valu": 12, "func": 12, "deprecate_nonkeyword_argu": 12, "decor": [12, 28, 32], "325": 12, "num_allow_arg": 12, "326": 12, "327": 12, "msg": 12, "argument": [12, 13], "_format_argument_list": 12, "allow_arg": 12, "328": 12, "futurewarn": 12, "329": 12, "stacklevel": 12, "find_stack_level": 12, "reader": [12, 21, 28], "950": 12, "filepath_or_buff": 12, "sep": 12, "delimit": [12, 22], "index_col": 12, "usecol": 12, "squeez": 12, "mangle_dupe_col": 12, "engin": 12, "true_valu": 12, "false_valu": 12, "skipinitialspac": 12, "skiprow": 12, "skipfoot": 12, "nrow": 12, "na_valu": 12, "keep_default_na": 12, "na_filt": 12, "verbos": 12, "skip_blank_lin": 12, "parse_d": 12, "infer_datetime_format": 12, "keep_date_col": 12, "date_pars": 12, "dayfirst": 12, "cache_d": 12, "chunksiz": 12, "compress": 12, "thousand": 12, "decim": [12, 20], "linetermin": 12, "quotechar": 12, "doublequot": 12, "escapechar": 12, "comment": [12, 21, 28, 32], "encod": [12, 15, 16], "encoding_error": 12, "dialect": 12, "error_bad_lin": 12, "warn_bad_lin": 12, "on_bad_lin": 12, "delim_whitespac": 12, "low_memori": 12, "memory_map": 12, "float_precis": 12, "storage_opt": 12, "935": 12, "kwds_default": 12, "_refine_defaults_read": 12, "936": 12, "937": 12, "946": 12, "default": [12, 13, 15, 22], "947": 12, "948": 12, "kwd": 12, "_read": 12, "605": 12, "602": 12, "_validate_nam": 12, "none": [12, 13, 28, 32], "604": [12, 30], "textfileread": 12, "607": 12, "608": 12, "1442": 12, "1439": 12, "has_index_nam": 12, "1441": 12, "iohandl": 12, "_engin": 12, "_make_engin": 12, "1735": 12, "1733": 12, "mode": [12, 33], "1734": 12, "get_handl": 12, "1736": 12, "1737": 12, "1738": 12, "1739": 12, "1740": 12, "1741": 12, "is_text": 12, "1742": 12, "strict": 12, "1743": 12, "1744": 12, "1745": 12, "assert": [12, 25], "1746": 12, "713": 12, "path_or_buf": 12, "710": 12, "codec": 12, "lookup_error": 12, "712": 12, "ioarg": 12, "_get_filepath_or_buff": 12, "714": 12, "715": 12, "716": 12, "717": 12, "718": 12, "719": 12, "721": 12, "722": 12, "basebuff": 12, "363": [12, 13], "361": [12, 13], "assum": 12, "interpret": [12, 25], "362": 12, "req_info": 12, "urllib": 12, "urlopen": 12, "req": 12, "364": [12, 13], "content_encod": 12, "365": [12, 13], "gzip": 12, "366": 12, "overrid": [12, 28], "265": 12, "259": 12, "260": 12, "lazi": 12, "stdlib": 12, "big": [12, 14, 16], "chunk": 12, "261": 12, "262": 12, "263": 12, "216": 12, "timeout": 12, "cafil": 12, "capath": 12, "cadefault": 12, "215": 12, "_open": 12, "525": 12, "openerdirector": 12, "fullurl": 12, "523": 12, "process_respons": 12, "protocol": [12, 27], "524": 12, "meth": 12, "getattr": 12, "meth_nam": 12, "527": 12, "634": 12, "httperrorprocessor": 12, "http_respons": 12, "631": 12, "rfc": 12, "2616": 12, "2xx": 12, "client": 12, "632": 12, "successfulli": 12, "receiv": [12, 28], "understood": 12, "accept": [12, 13, 20], "633": 12, "parent": [12, 28, 32], "635": 12, "hdr": 12, "637": 12, "557": 12, "proto": 12, "555": 12, "http_err": 12, "556": 12, "_call_chain": 12, "558": 12, "559": 12, "496": 12, "494": 12, "handler": 12, "495": 12, "497": 12, "498": 12, "749": 12, "httpredirecthandl": 12, "http_error_302": 12, "fp": 12, "746": 12, "747": 12, "563": 12, "561": 12, "562": [12, 28], "http_error_default": 12, "orig_arg": 12, "643": 12, "httpdefaulterrorhandl": 12, "642": 12, "rais": 12, "full_url": 12, "404": 12, "sdf": 12, "drop_dupl": 12, "subset": [12, 15], "congr": 12, "bob": 12, "va": 12, "a006": 12, "277": 12, "h2902": 12, "h2916": 12, "nfrom": 12, "bigg": 12, "andi": 12, "az": [12, 28], "a004": 12, "fail": [12, 14, 28], "268": 12, "repo": 12, "davidson": 12, "warren": [12, 16], "oh": [12, 28], "a041": 12, "2670": 12, "h3581": 12, "h3600": 12, "274": 12, "compris": 12, "amendm": 12, "roger": 12, "mike": 12, "al": [12, 19, 25, 28, 32], "a04": 12, "roi": 12, "chip": 12, "tx": [12, 28], "a040": 12, "o": [12, 22, 23], "chyna": 12, "gibson": 12, "stop": 12, "murder": 12, "epid": 12, "ideal": 12, "forc": [12, 16], "depend": [12, 20, 26, 27], "choic": [12, 28], "pride": 12, "mental": 12, "june": 12, "interna": 12, "patriot": 12, "gender_in_titl": 12, "remembr": [12, 30], "epidem": 12, "lost": 12, "safeti": [12, 28], "econom": [12, 28, 32], "secur": 12, "visibl": [12, 28], "902": 12, "4960": 12, "5196": 12, "1064": 12, "3850": 12, "568": 12, "418": 12, "4398": 12, "223": 12, "1960": 12, "persist": 12, "bs4": [12, 19, 27, 31], "beautifulsoup": [12, 28, 32], "scrape_just_text": 12, "118hr": 12, "soup": [12, 32], "lxml": [12, 28, 32], "stuff": 12, "get_text": 12, "full_text": 12, "desir": [12, 22, 28, 33], "FOR": 12, "bill_text": 12, "unwant": [12, 19], "whitespac": [12, 22], "__": 12, "replac": 12, "take_out": 12, "stat": 12, "pip": [13, 15], "trl": [13, 15], "load_dataset": [13, 15], "automodelforcausallm": 13, "autotoken": 13, "trainingargu": 13, "sfttrainer": 13, "from_pretrain": 13, "eleutherai": [13, 14, 15], "gpt": [13, 14, 15], "neo": [13, 14, 15], "125m": [13, 14, 15], "gofilipa": [13, 15], "gender_congress_117": [13, 15], "cach": [13, 15], "huggingfac": [13, 15, 17], "gofilipa___csv": [13, 15], "304e9fdc48b3d0d4": [13, 15], "6954658bab30a358235fa864b05cf819af0e179325c740e4bc853bcc7ec513e1": [13, 15], "size": [13, 14, 16, 28, 31, 32], "batch": 13, "fix": 13, "tensor": 13, "truncat": [13, 15], "deal": 13, "problem": [13, 14], "rectangular": 13, "vari": [13, 23, 27], "special": [13, 28], "shorter": [13, 28], "longest": 13, "maximum": 13, "direct": [13, 16, 22, 28], "pad_token": 13, "eos_token": 13, "padding_sid": 13, "training_param": 13, "output_dir": 13, "num_train_epoch": 13, "learning_r": 13, "2e": 13, "adjust": [13, 28], "loss": 13, "weight_decai": 13, "001": 13, "trainer": 13, "train_dataset": 13, "dataset_text_field": 13, "sft_trainer": 13, "246": 13, "didn": 13, "max_seq_length": 13, "1024": 13, "b4c92d61089f8e9c": 13, "arrow": 13, "epoch": 13, "358": 13, "neftune_noise_alpha": 13, "_trainer_supports_neftun": 13, "359": 13, "_trl_activate_neftun": 13, "retriev": 13, "embed": [13, 16, 27], "post": 13, "hook": [13, 21, 22, 23, 25, 26], "1780": 13, "resume_from_checkpoint": 13, "trial": 13, "ignore_keys_for_ev": 13, "1778": 13, "hf_hub_util": 13, "enable_progress_bar": 13, "1779": 13, "inner_training_loop": 13, "1781": 13, "1782": 13, "1783": 13, "1784": 13, "1785": 13, "2118": 13, "_inner_training_loop": 13, "2115": 13, "callback_handl": 13, "on_step_begin": 13, "2117": 13, "acceler": 13, "accumul": 13, "tr_loss_step": 13, "training_step": 13, "2120": 13, "2121": 13, "logging_nan_inf_filt": 13, "2122": 13, "is_torch_xla_avail": 13, "2123": 13, "torch": 13, "isnan": 13, "isinf": 13, "2124": 13, "2125": 13, "inf": 13, "simpli": [13, 20, 21], "averag": 13, "2126": 13, "tr_loss": 13, "global_step": 13, "_globalstep_last_log": 13, "3036": 13, "3033": 13, "loss_mb": 13, "reduce_mean": 13, "detach": 13, "devic": [13, 21, 22, 23, 25, 26], "3035": 13, "compute_loss_context_manag": 13, "compute_loss": 13, "3038": 13, "n_gpu": 13, "3039": 13, "multi": 13, "gpu": [13, 15], "parallel": [13, 15], "3059": 13, "return_output": 13, "3057": 13, "3058": 13, "3060": 13, "3061": 13, "todo": 13, "3062": 13, "past_index": 13, "nn": 13, "1511": 13, "_wrapped_call_impl": 13, "1509": 13, "_compiled_call_impl": 13, "misc": 13, "1510": 13, "_call_impl": 13, "1520": 13, "1515": 13, "logic": [13, 24, 32], "1516": 13, "1517": 13, "_backward_hook": 13, "_backward_pre_hook": 13, "_forward_hook": 13, "_forward_pre_hook": 13, "1518": 13, "_global_backward_pre_hook": 13, "_global_backward_hook": 13, "1519": 13, "_global_forward_hook": 13, "_global_forward_pre_hook": 13, "forward_cal": 13, "1522": 13, "1523": 13, "gpt_neo": 13, "modeling_gpt_neo": 13, "975": 13, "gptneoforcausallm": 13, "input_id": 13, "past_key_valu": 13, "attention_mask": 13, "token_type_id": 13, "position_id": 13, "head_mask": 13, "inputs_emb": 13, "use_cach": 13, "output_attent": 13, "output_hidden_st": 13, "return_dict": 13, "967": 13, "968": 13, "longtensor": 13, "sequence_length": 13, "969": 13, "shift": [13, 21, 22, 23, 25, 26, 27], "set": [13, 15, 28], "970": 13, "config": 13, "vocab_s": 13, "971": 13, "mask": 13, "972": 13, "973": 13, "use_return_dict": 13, "transformer_output": 13, "976": 13, "977": 13, "978": [13, 28], "979": 13, "980": 13, "981": 13, "982": 13, "983": 13, "984": 13, "985": 13, "986": 13, "987": 13, "988": 13, "hidden_st": 13, "990": 13, "lm_logit": 13, "lm_head": 13, "788": 13, "gptneomodel": 13, "785": 13, "past_length": 13, "787": 13, "arang": 13, "input_shap": 13, "789": 13, "unsqueez": 13, "791": 13, "792": 13, "793": 13, "attention_prob": 13, "bsz": 13, "num_head": 13, "794": 13, "n_layer": 13, "hypothesi": 13, "calcul": [13, 16], "descent": 13, "slowli": 13, "minim": 13, "save_pretrain": 13, "tokenizer_config": 13, "special_tokens_map": 13, "merg": 13, "added_token": 13, "max_length": [13, 15], "generated_text": [13, 15], "orrogen": 13, "aren": [13, 14], "great": [13, 23], "better": 13, "rate": 13, "move": [14, 16, 19, 26, 27], "ai": [14, 16, 27], "compani": [14, 27, 28, 32], "brooklyn": 14, "york": [14, 33], "citi": [14, 23, 28, 33], "host": [14, 24, 28], "had": [14, 16], "addit": [14, 21, 28, 29, 30], "besid": [14, 21, 27], "paper": [14, 16], "app": 14, "etc": [14, 20, 27, 28, 30, 33], "navig": [14, 27, 28, 30, 33], "classif": [14, 30], "filter": [14, 22], "wav2vec": 14, "audio": [14, 28], "vector": [14, 17], "roberta": 14, "permut": 14, "bert": [14, 16], "architectur": [14, 16], "click": [14, 15, 27, 28, 29, 33], "stabl": 14, "diffus": 14, "keyword": 14, "infer": [14, 17, 20], "enter": [14, 21, 24, 28, 32], "prompt": [14, 15], "hf": [14, 15], "amaz": [14, 20], "main": [14, 28], "explan": [14, 16], "licens": [14, 16, 19, 27, 28], "ethic": [14, 19, 21, 22, 23, 25, 26, 28, 31], "bias": 14, "environment": [14, 28, 32], "rare": 14, "profit": 14, "lab": 14, "preform": 14, "mit": 14, "permiss": [14, 16, 27], "modifi": [14, 21, 28], "wish": 14, "commerci": [14, 27, 28, 32], "mintu": 14, "anyth": 14, "repetit": 14, "highest": 14, "ones": [14, 17, 20, 21, 27], "evalu": [14, 20, 22, 26, 28], "littl": [14, 21, 28, 29], "peak": [14, 17], "dive": 14, "internet": [14, 27], "bia": 14, "attempt": [14, 27, 28], "dirti": 14, "obscen": [14, 28], "rlhf": 14, "reinforc": 14, "human": [14, 19, 20, 21, 25, 27, 28], "feedback": 14, "labor": 14, "exploit": [14, 21, 22, 23, 25, 26, 27], "tldr": 14, "race": [14, 21, 22, 23, 25, 26], "adequ": 14, "safe": [14, 28], "Will": 15, "talk": [15, 19, 20, 23, 33], "grappl": 15, "toolbar": 15, "ram": 15, "disk": 15, "hardwar": 15, "accel": 15, "copi": [15, 21, 27], "fanci": 15, "hello": [15, 20, 22, 23, 26], "explicitli": [15, 21, 22, 23, 25, 26], "max": [15, 28, 32], "longest_first": 15, "glue": 15, "precis": [15, 26], "pad_token_id": 15, "eos_token_id": 15, "50256": 15, "newbi": 15, "abstract": [15, 19, 25], "inspect": [15, 29], "first_nam": 15, "last_nam": 15, "loader": 15, "fork": 15, "avoid": [15, 22, 23, 30], "deadlock": 15, "tokenizers_parallel": 15, "datasetdict": 15, "num_row": 15, "dataset_dict": 15, "broad": 16, "artifici": 16, "vision": [16, 27], "howev": [16, 21, 23, 27], "hood": [16, 29], "chatgpt": [16, 27], "respond": [16, 28], "someon": [16, 21, 26], "question": [16, 21, 27, 28, 31], "massiv": 16, "glean": 16, "thank": [16, 30], "quantifi": 16, "technic": [16, 21, 27, 33], "togeth": [16, 20, 22, 27, 30], "coordin": 16, "probabl": [16, 23], "databas": 16, "cat": 16, "dog": 16, "must": [16, 20], "tiger": 16, "cute": 16, "bone": 16, "wolf": 16, "gensim": 16, "datast": 16, "twitter": [16, 28, 33], "glove": 16, "word2vec": [16, 17], "glove_vector": 16, "most_similar": 16, "9371739029884338": 16, "mother": 16, "9214695692062378": 16, "whose": [16, 22], "917497456073761": 16, "9146499633789062": 16, "913553774356842": 16, "wife": 16, "9088310599327087": 16, "9037442803382874": 16, "father": 16, "9028053283691406": 16, "gui": 16, "9026350975036621": 16, "8997253179550171": 16, "9065622687339783": 16, "8880172371864319": 16, "he": 16, "887438178062439": 16, "bad": 16, "8846145272254944": 16, "8832387924194336": 16, "8784030079841614": 16, "8764979243278503": 16, "8764553666114807": 16, "8762108683586121": 16, "glad": 16, "8758710622787476": 16, "protest": 16, "9241024851799011": 16, "9001613259315491": 16, "afghanistan": 16, "8905416131019592": 16, "activist": 16, "8872407078742981": 16, "troop": 16, "880148708820343": 16, "8785053491592407": 16, "8769642114639282": 16, "8767853379249573": 16, "prison": [16, 28], "8743768930435181": 16, "8693628311157227": 16, "cornel": 16, "8837954998016357": 16, "872944712638855": 16, "emori": 16, "8666537404060364": 16, "quinci": 16, "863002359867096": 16, "dudlei": 16, "8600769639015198": 16, "dayton": 16, "8584739565849304": 16, "carson": 16, "8520109057426453": 16, "savannah": 16, "8516344428062439": 16, "pearson": 16, "8490176200866699": 16, "trump": 16, "8488551378250122": 16, "math": 16, "linear": 16, "algebra": 16, "cosin": 16, "semant": [16, 20, 21, 23], "calculu": 16, "famou": 16, "formula": 16, "formular": 16, "realiz": 16, "deepli": [16, 33], "\u0153": 16, "exactli": 16, "subtract": 16, "jai": 16, "alammar": 16, "mechanim": 16, "2017": 16, "2018": 16, "Is": [16, 28], "matter": [16, 21, 27, 28], "taken": [16, 25, 28], "neural": 16, "took": 16, "preced": [16, 28], "With": [16, 19, 26, 28, 32], "stand": [16, 20, 23, 26, 28, 33], "bidirect": 16, "apach": 16, "inspir": [16, 19], "descend": 16, "firsthand": 16, "creation": [16, 27], "gigabit": 16, "week": 16, "further": [16, 23, 26, 27, 28, 32], "smaller": [16, 26, 32], "focus": [16, 28], "finbert": 16, "financi": [16, 27, 28], "de": 16, "mystifi": 16, "magic": 16, "intuit": [16, 21], "polish": 16, "applic": [16, 28, 29, 33], "major": [16, 28, 30, 33], "ever": 16, "ecosystem": 16, "platform": 17, "student": [17, 28, 32], "hpc": 17, "cluster": 17, "edu": 19, "friendli": [19, 27, 33], "langaug": 19, "varieti": 19, "third": [19, 21, 28], "fourth": [19, 21], "fifth": 19, "deep": [19, 20], "descript": [19, 21, 27, 28, 32], "fundament": 19, "ground": 19, "awar": [19, 33], "programmat": [19, 21, 23, 31, 32, 33], "metadata": [19, 31], "anti": [19, 28, 29], "usa": 19, "wrangl": 19, "emphasi": [19, 27], "skew": 19, "script": [19, 22, 25], "small": [19, 28, 31], "sign": [19, 28, 30, 33], "consult": 19, "curriculum": [19, 28], "graduat": 19, "challeng": 19, "feminist": [19, 21, 22, 23, 25, 26], "manifest": [19, 23, 25], "No": [19, 25, 28, 30], "cifor": [19, 25], "garcia": [19, 25], "et": [19, 25], "book": 19, "wjb": 19, "humanist": 19, "melani": 19, "walsh": 19, "analyt": 19, "noncommerci": 19, "sharealik": 19, "integ": [20, 22, 26], "boolean": [20, 26], "hear": [20, 28, 30], "w3school": [20, 22], "upcom": 20, "lesson": [20, 21], "letter": [20, 21, 22, 23, 28, 32], "symbol": [20, 21, 28], "enclos": 20, "truth": [20, 26], "falsiti": 20, "foundat": [20, 31], "donut": 20, "smoothi": 20, "coffe": [20, 21, 23, 26], "banana": 20, "abov": [20, 23, 26, 27, 28, 30, 33], "figur": [20, 26, 28, 32, 33], "softwar": [20, 24, 27, 33], "alphanumer": 20, "wrap": [20, 21, 28, 32], "quotat": [20, 21], "mark": [20, 21], "ocean": 20, "fall": 20, "perhap": [20, 21, 27], "blue": [20, 28], "depth": 20, "color": [20, 28, 32], "sensat": 20, "evok": 20, "readabl": 20, "inevit": 20, "reduc": [20, 25], "simplifi": 20, "thu": [20, 22], "said": [20, 21], "cannot": [20, 27], "headach": 20, "nuisanc": 20, "ascrib": 21, "implicit": 21, "bracket": [21, 22, 30], "breakfast": [21, 23, 26], "granola": [21, 26], "cashew": [21, 26], "yogurt": [21, 26], "strawberri": [21, 23], "mango": 21, "offset": [21, 28, 32], "movement": 21, "peek": 21, "strang": 21, "clockwis": 21, "counterclockwis": 21, "unlik": 21, "conveni": 21, "portion": 21, "colon": 21, "everi": [21, 22, 23, 25, 26, 27, 28, 32], "wonki": 21, "inclus": [21, 28], "exclus": [21, 28], "tricki": 21, "until": [21, 28, 30], "confus": 21, "memor": 21, "One": 21, "similarli": 21, "trick": 21, "nifti": 21, "yummi": 21, "bagel": 21, "cream": 21, "chees": 21, "orang": [21, 28], "juic": 21, "pop": [21, 28, 29], "off": [21, 22, 23, 25, 26, 27], "delet": 21, "sort": 21, "revers": [21, 28], "tripl": 21, "break": [21, 28, 32], "mess": 21, "refus": [21, 22, 23, 25, 26, 28], "oper": [21, 22, 23, 25, 26, 28], "risk": [21, 22, 23, 25, 26, 27], "harm": [21, 22, 23, 25, 26, 27, 28, 32], "bound": [21, 22, 23, 25, 26], "everyon": [21, 22, 23, 25, 26], "everywher": [21, 22, 23, 25, 26], "commit": [21, 22, 23, 25, 26, 27, 28, 30], "acknowledg": [21, 22, 23, 25, 26], "histor": [21, 22, 23, 25, 26], "vulner": [21, 22, 23, 25, 26, 27, 28], "disciplin": [21, 22, 23, 25, 26, 28], "racial": [21, 22, 23, 25, 26, 27], "track": [21, 22, 23, 25, 26, 27], "monitor": [21, 22, 23, 25, 26, 27], "surveil": [21, 22, 23, 25, 26, 27], "behav": [21, 22, 23, 25, 26], "technolog": [21, 22, 23, 25, 26, 27], "perpetu": [21, 22, 23, 25, 26], "embrac": [21, 22, 23, 25, 26], "intention": [21, 22, 23, 25, 26], "corpus": [21, 22, 23, 25, 26], "laid": [21, 22, 23, 25, 26], "whom": [21, 22, 23, 25, 26, 27], "disembodi": [21, 22, 23, 25, 26], "dehuman": [21, 22, 23, 25, 26], "departicular": [21, 22, 23, 25, 26], "various": [21, 22, 23, 25, 26], "attach": [21, 22, 23, 25, 26], "vow": [21, 22, 23, 25, 26], "interrog": [21, 22, 23, 25, 26], "biopolit": [21, 22, 23, 25, 26], "keen": [21, 22, 23, 25, 26], "ey": [21, 22, 23, 25, 26], "embodi": [21, 22, 23, 25, 26], "phoni": [21, 22, 23, 25, 26], "proclam": [21, 22, 23, 25, 26], "transpar": [21, 22, 23, 25, 26, 28, 32], "wield": [21, 22, 23, 25, 26], "cover": [21, 22, 23, 25, 26, 27], "escap": [21, 22, 23, 25, 26], "equiti": [21, 22, 23, 25, 26, 28], "justic": [21, 22, 23, 25, 26], "text_split": 21, "li": 21, "omit": 21, "spot": 21, "rogu": 21, "hint": 21, "rush": 21, "grasp": [21, 23], "alphabet": 21, "hashtag": [21, 28], "tell": [21, 27, 29], "pyhon": 21, "meant": [21, 28], "plenti": 21, "revisit": 21, "flow": 22, "throughout": [22, 27], "closer": 22, "equival": 22, "statment": 22, "greater": 22, "indent": 22, "group": [22, 24, 27], "written": [22, 28], "expand": [22, 28], "elif": 22, "catchal": 22, "l": [22, 23, 28], "rather": 22, "period": [22, 26], "indentationerror": 22, "unind": 22, "outer": [22, 28], "twenti": 22, "screen": [22, 23, 28, 32], "capit": [22, 23], "think": [22, 23, 26, 27, 28, 33], "congratul": 22, "conceptu": 23, "difficult": 23, "easier": [23, 28, 30], "egg": 23, "sandwich": 23, "biscuit": 23, "gravi": 23, "omelett": 23, "liter": 23, "fly": 23, "beforehand": 23, "nameerror": 23, "hasn": 23, "meaning": [23, 26], "concis": 23, "convent": 23, "shorthand": 23, "lisbon": 23, "setub": 23, "alcac": 23, "sal": 23, "lago": 23, "NO": [23, 25], "words_low": 23, "drop": 23, "intro": [24, 28, 32], "wherea": 24, "black": [24, 28], "box": [24, 27, 28, 32], "press": 24, "snippit": 25, "landmark": 25, "marika": 25, "patricia": 25, "aim": 25, "life": 25, "reduct": 25, "unavoid": 25, "consider": [25, 27, 31], "prioriti": 25, "almost": 26, "anybodi": 26, "encourag": [26, 27], "highli": 26, "accur": 26, "succinctli": 26, "muffin": 26, "minut": [26, 28], "upper": 26, "uppercas": 26, "greet": 26, "dot": [26, 28], "previous": 26, "correct": [26, 28], "deeper": [26, 28], "futher": 26, "recogniz": 26, "easili": 26, "dat": 26, "brief": [27, 33], "overview": [27, 29, 33], "michigan": 27, "guidebook": 27, "reproduc": 27, "outset": 27, "carefulli": 27, "pertain": 27, "affect": [27, 28], "especi": [27, 33], "communin": 27, "margin": [27, 28, 32], "yourself": [27, 33], "owner": [27, 33], "intend": 27, "basi": [27, 28], "standard": [27, 28, 32], "deliber": 27, "repurpos": 27, "ye": 27, "forgo": 27, "indigen": 27, "popul": 27, "reach": [27, 28, 30], "privat": [27, 28], "scrutini": 27, "benefit": [27, 28], "oppress": 27, "thought": 27, "distinct": 27, "free": [27, 28, 32, 33], "domain": 27, "holder": [27, 33], "ip": 27, "copyright": 27, "lead": 27, "permit": [27, 28], "mine": 27, "robot": 27, "privaci": [27, 28], "thoroughli": 27, "clearli": 27, "sidebar": [27, 32], "too": 27, "violat": [27, 28, 32], "academ": [27, 33], "sell": 27, "fair": [27, 28], "worth": 27, "openai": 27, "corner": 27, "compens": 27, "openli": 27, "stipul": 27, "worst": 27, "offend": [27, 28], "polic": 27, "facial": 27, "clearview": 27, "infam": 27, "imag": [27, 28], "media": [27, 28, 32], "enforc": [27, 28, 32], "profil": 27, "hurdl": 27, "aris": 27, "logist": 27, "path": [27, 28, 33], "negoti": 27, "wouldn": 27, "sought": 27, "scrapabl": 27, "com": [27, 28, 29, 30, 32], "came": 27, "aggreg": 27, "billtrack50": 27, "agent": 27, "disallow": 27, "bot": 27, "asterisk": 27, "shut": 27, "door": 27, "scraper": [27, 29, 33], "fairli": 27, "contend": 27, "admin": 27, "game": 27, "quickli": 27, "discov": 27, "dynam": [27, 33], "interfac": [27, 33], "static": 27, "javascript": [27, 33], "scrollabl": 27, "button": [27, 28, 32], "bar": 27, "reload": 27, "interestingli": 27, "lock": 27, "selenium": 27, "simul": [27, 33], "scroll": [27, 28], "unfortun": 27, "couldn": 27, "inspector": [27, 28, 32], "aclu": 27, "attack": 27, "obstacl": 27, "blocker": 27, "guard": 27, "wrong": 27, "webpag": [27, 28, 29, 32, 33], "credit": 27, "encount": 27, "curat": 27, "leglisl": 27, "wonderfulli": 27, "beautifulsoup4": 28, "translegisl": [28, 29, 32], "html_code": [28, 32], "target": 28, "red": 28, "closest": 28, "menu": [28, 29], "h3": [28, 32], "href": [28, 29, 32], "chakra": [28, 32], "css": [28, 32], "1vygpf9": [28, 32], "emot": [28, 32], "f4h6ui": [28, 32], "properti": [28, 32], "var": [28, 32], "durat": [28, 32], "fast": [28, 32], "eas": [28, 32], "cursor": [28, 32], "pointer": [28, 32], "webkit": [28, 32], "outlin": [28, 32], "2px": [28, 32], "solid": [28, 31, 32], "inherit": [28, 32], "hover": [28, 32], "underlin": [28, 32], "shadow": [28, 32], "hb261": [28, 32], "div": [28, 32], "reactroot": 28, "id": [28, 29, 32, 33], "__next": 28, "1o2ia7f": 28, "ring": 28, "inset": 28, "width": [28, 32], "0px": [28, 32], "fff": 28, "rgba": 28, "225": 28, "0000": 28, "currentcolor": 28, "000000": 28, "white": [28, 32], "ffffff": 28, "whitealpha": 28, "600": 28, "700": 28, "800": 28, "900": 28, "blackalpha": 28, "grai": [28, 32], "f7fafc": 28, "edf2f7": 28, "e2e8f0": 28, "cbd5e0": 28, "a0aec0": 28, "718096": 28, "4a5568": 28, "2d3748": 28, "1a202c": 28, "171923": 28, "fff5f5": 28, "fed7d7": 28, "feb2b2": 28, "fc8181": 28, "f56565": 28, "e53e3": 28, "c53030": 28, "9b2c2c": 28, "822727": 28, "63171b": 28, "fffaf0": 28, "feebc8": 28, "fbd38d": 28, "f6ad55": 28, "ed8936": 28, "dd6b20": 28, "c05621": 28, "9c4221": 28, "7b341e": 28, "652b19": 28, "yellow": 28, "fffff0": 28, "fefcbf": 28, "faf089": 28, "f6e05": 28, "ecc94b": 28, "d69e2e": 28, "b7791f": 28, "975a16": 28, "744210": 28, "5f370e": 28, "green": 28, "f0fff4": 28, "c6f6d5": 28, "9ae6b4": 28, "68d391": 28, "48bb78": 28, "38a169": 28, "2f855a": 28, "276749": 28, "22543d": 28, "1c4532": 28, "teal": 28, "e6fffa": 28, "b2f5ea": 28, "81e6d9": 28, "4fd1c5": 28, "38b2ac": 28, "319795": 28, "2c7a7b": 28, "285e61": 28, "234e52": 28, "1d4044": 28, "ebf8ff": 28, "bee3f8": 28, "90cdf4": 28, "63b3ed": 28, "4299e1": 28, "3182ce": 28, "2b6cb0": 28, "2c5282": 28, "2a4365": 28, "1a365d": 28, "cyan": 28, "edfdfd": 28, "c4f1f9": 28, "9decf9": 28, "76e4f7": 28, "0bc5ea": 28, "00b5d8": 28, "00a3c4": 28, "0987a0": 28, "086f83": 28, "065666": 28, "purpl": 28, "faf5ff": 28, "e9d8fd": 28, "d6bcfa": 28, "b794f4": 28, "9f7aea": 28, "805ad5": 28, "6b46c1": 28, "553c9a": 28, "44337a": 28, "322659": 28, "pink": 28, "fff5f7": 28, "fed7e2": 28, "fbb6ce": 28, "f687b3": 28, "ed64a6": 28, "d53f8c": 28, "b83280": 28, "97266d": 28, "702459": 28, "521b41": 28, "linkedin": 28, "e8f4f9": 28, "cfedfb": 28, "9bdaf3": 28, "68c7ec": 28, "34b3e4": 28, "00a0dc": 28, "008cc9": 28, "0077b5": 28, "005e93": 28, "004471": 28, "facebook": 28, "d9dee9": 28, "b7c2da": 28, "6482c0": 28, "4267b2": 28, "385898": 28, "314e89": 28, "29487d": 28, "223b67": 28, "1e355b": 28, "messeng": 28, "d0e6ff": 28, "b9daff": 28, "a2cdff": 28, "7ab8ff": 28, "2e90ff": 28, "0078ff": 28, "0063d1": 28, "0052ac": 28, "003c7e": 28, "002c5c": 28, "whatsapp": 28, "dffeec": 28, "b9f5d0": 28, "90edb3": 28, "65e495": 28, "3cdd78": 28, "22c35e": 28, "179848": 28, "0c6c33": 28, "01421c": 28, "001803": 28, "e5f4fd": 28, "c8e9fb": 28, "a8dcfa": 28, "83cdf7": 28, "57bbf5": 28, "1da1f2": 28, "1a94da": 28, "1681bf": 28, "136b9e": 28, "0d4d71": 28, "telegram": 28, "e3f2f9": 28, "c5e4f3": 28, "a2d4ec": 28, "7ac1e4": 28, "47a9da": 28, "0088cc": 28, "007ab8": 28, "006ba1": 28, "005885": 28, "003f5e": 28, "brand": 28, "2a69ac": 28, "153e75": 28, "border": [28, 32], "1px": [28, 32], "4px": 28, "8px": 28, "font": [28, 32], "appl": 28, "blinkmacsystemfont": 28, "sego": 28, "ui": 28, "helvetica": 28, "arial": 28, "serif": 28, "emoji": 28, "mono": 28, "sfmono": 28, "menlo": 28, "monaco": 28, "consola": 28, "liber": 28, "courier": 28, "monospac": 28, "fontsiz": [28, 32], "75rem": 28, "sm": [28, 32], "875rem": 28, "md": [28, 32], "1rem": 28, "lg": 28, "125rem": 28, "xl": [28, 32], "25rem": 28, "2xl": [28, 32], "5rem": [28, 32], "3xl": [28, 32], "4xl": 28, "5xl": 28, "3rem": 28, "6xl": 28, "7xl": 28, "8xl": 28, "6rem": 28, "9xl": 28, "8rem": 28, "fontweight": [28, 32], "hairlin": 28, "thin": 28, "light": 28, "medium": [28, 32], "semibold": [28, 32], "bold": [28, 32], "extrabold": 28, "letterspac": [28, 32], "tighter": 28, "05em": 28, "tight": 28, "025em": 28, "wide": [28, 32], "wider": 28, "widest": 28, "1em": 28, "lineheight": 28, "2rem": 28, "375": 28, "tall": 28, "625": 28, "taller": 28, "radii": 28, "375rem": 28, "9999px": 28, "4rem": 28, "7rem": 28, "9rem": 28, "10rem": 28, "11rem": 28, "12rem": 28, "13rem": 28, "14rem": 28, "15rem": 28, "16rem": 28, "18rem": 28, "20rem": 28, "24rem": 28, "px": 28, "625rem": 28, "3px": 28, "6px": 28, "10px": 28, "15px": 28, "20px": 28, "25px": 28, "5px": 28, "50px": 28, "12px": 28, "inner": 28, "dark": 28, "40px": 28, "min": [28, 32], "3x": 28, "2x": 28, "28rem": 28, "32rem": 28, "36rem": 28, "42rem": 28, "48rem": 28, "56rem": 28, "64rem": 28, "72rem": 28, "80rem": 28, "90rem": 28, "640px": 28, "768px": 28, "1024px": 28, "1280px": 28, "zindic": 28, "hide": 28, "auto": [28, 32], "dock": 28, "dropdown": [28, 29], "sticki": 28, "1100": 28, "banner": 28, "1200": 28, "overlai": 28, "1300": 28, "modal": 28, "1400": 28, "popov": 28, "1500": 28, "skiplink": 28, "1600": 28, "toast": 28, "1700": 28, "tooltip": 28, "1800": 28, "background": [28, 32], "stroke": 28, "opac": [28, 32], "dimens": 28, "height": [28, 32], "cubic": 28, "bezier": 28, "ultra": 28, "50m": 28, "faster": 28, "100m": 28, "150m": 28, "200m": 28, "slow": 28, "300m": 28, "slower": 28, "400m": 28, "500m": 28, "blur": 28, "16px": 28, "24px": 28, "64px": 28, "1jqlf9g": 28, "smooth": 28, "antialias": 28, "optimizeleg": 28, "moz": [28, 32], "osx": 28, "grayscal": 28, "touch": 28, "kern": 28, "overflow": [28, 32], "kbd": 28, "samp": 28, "abbr": 28, "strong": 28, "sub": 28, "sup": 28, "vertic": [28, 32], "align": [28, 32], "baselin": [28, 32], "25em": 28, "5em": 28, "img": 28, "optgroup": 28, "textarea": 28, "reset": 28, "fieldset": 28, "35em": 28, "75em": 28, "625em": 28, "legend": 28, "checkbox": 28, "radio": 28, "spin": 28, "textfield": 28, "itembox": 28, "templat": 28, "hidden": [28, 32], "blockquot": 28, "dl": 28, "dd": 28, "h1": [28, 29], "h2": [28, 29, 32], "h4": 28, "h5": 28, "h6": 28, "ol": 28, "ul": 28, "resiz": 28, "collaps": 28, "svg": 28, "video": 28, "canva": 28, "ifram": 28, "emb": 28, "js": 28, "1baqkrf": 28, "placehold": 28, "1v5zkf": 28, "flex": [28, 32], "flexbox": [28, 32], "60px": 28, "inlin": [28, 32], "1twb9xo": 28, "calc": 28, "48em": [28, 32], "103jld": 28, "pack": [28, 32, 33], "justifi": [28, 32], "nowrap": [28, 32], "middl": [28, 32], "radiu": [28, 32], "aria": [28, 32], "toggl": 28, "bokek7": 28, "shrink": 28, "icon": 28, "viewbox": 28, "0001": 28, "1ef8uzr": 28, "1g6ksko": 28, "1ynfsg": 28, "nd8846": 28, "stack": 28, "1yt6u0r": 28, "haspopup": 28, "dialog": 28, "trigger": 28, "rise": 28, "event": 28, "x7x3n6": 28, "nzo8h4": 28, "100px": 28, "ko": 28, "fi": 28, "src": 28, "kofi": 28, "png": 28, "1lgh1g": 28, "egoftb": 28, "lxmzlz": 28, "ryc07z": 28, "9y4vnp": 28, "home": 28, "11sp92w": 28, "1ff2web": 28, "6d6uom": 28, "qwq9lj": 28, "q2ryjt": 28, "1bd77w": 28, "600px": 28, "pr2tx6": 28, "bxak8j": [28, 32], "i3jkqk": 28, "18z2gjh": 28, "kxz3vr": 28, "b55202": [28, 32], "ic6w7t": 28, "3e3f30": [28, 32], "ax9tjb": 28, "a33469": [28, 32], "ip2ti6": 28, "005649": 28, "1nwst2d": 28, "005b99": 28, "13i6snw": 28, "713999": 28, "1nzw9zg": 28, "269686": 28, "1i3mhs2": 28, "3f2a56": 28, "incarcer": 28, "oamswl": 28, "c89f46": 28, "certif": 28, "181818": [28, 32], "11nx2ml": 28, "alabama": [28, 32], "arkansa": [28, 32], "florida": 28, "georgia": 28, "iowa": 28, "idaho": 28, "indiana": 28, "kansa": 28, "kentucki": 28, "louisiana": 28, "missouri": 28, "mississippi": 28, "montana": 28, "dakota": 28, "nebraska": 28, "ohio": 28, "oklahoma": 28, "south": 28, "tennesse": 28, "texa": 28, "utah": 28, "wisconsin": 28, "west": 28, "virginia": 28, "wyom": 28, "veto": [28, 30], "subsequ": 28, "1jb6aae": 28, "grid": 28, "repeat": 28, "minmax": 28, "1fr": 28, "1dqx0r": 28, "13ik503": 28, "dvhl9z": 28, "accordion": 28, "17mg6aq": 28, "anchor": 28, "accordion__item": 28, "1ygl3x": 28, "panel": 28, "accordion__button": 28, "1eziwv": 28, "186l2rg": 28, "2s": 28, "accordion__icon": 28, "m16": 28, "59l12": 28, "10l6": 28, "6z": 28, "1cu5i0n": 28, "labelledbi": 28, "accordion__panel": 28, "region": 28, "795uwx": 28, "35ezg3": 28, "oga2ct": [28, 32], "h1425": 28, "_self": 28, "bcf15j": [28, 32], "ks": 28, "hb2436": 28, "motion": 28, "prevail": 28, "yea": 28, "nai": 28, "sb233": 28, "1hlc5z2": 28, "e3e3e3": 28, "h1291": 28, "pend": 28, "governor": 28, "signatur": 28, "hb68": 28, "tn": 28, "sb2766": 28, "sb1182": 28, "sb1810": 28, "transmit": 28, "hb2169": 28, "comp": 28, "becam": [28, 30], "pub": 28, "ch": 28, "677": 28, "sb1738": 28, "sb2861": 28, "3e1l4l": 28, "182w0dq": 28, "1it7loc": 28, "4rck61": [28, 32], "1dvz6tu": [28, 32], "wd7aku": [28, 32], "bu60l4": [28, 32], "bp9bt3": [28, 32], "ellipsi": [28, 32], "clamp": [28, 32], "higher": [28, 32], "1975": [28, 32], "athlet": [28, 32], "team": [28, 32], "advers": [28, 32], "compli": [28, 32], "retali": [28, 32], "remedi": [28, 32], "suffer": [28, 32], "directi": [28, 32], "depriv": [28, 32], "1952nyr": [28, 32], "sb261": [28, 32], "iyw6hm": [28, 32], "contract": [28, 32], "government": [28, 32], "boycott": [28, 32], "busi": [28, 32], "sector": [28, 32], "corpor": [28, 32], "facilit": [28, 32], "penal": [28, 32], "declin": [28, 32], "polit": [28, 32], "ideolog": [28, 32], "attornei": [28, 32], "inflict": [28, 32], "resid": [28, 32], "investig": [28, 32], "hb1156": [28, 32], "bvx26t": [28, 32], "concern": [28, 32], "district": [28, 32], "enrol": [28, 32], "charter": [28, 32], "hb1468": [28, 32], "9x1vkf": 28, "employe": [28, 32], "prefer": [28, 32], "pronoun": [28, 32], "consent": [28, 32], "hb1615": [28, 32], "conscienc": [28, 32], "religi": [28, 32], "freedom": [28, 32], "restor": [28, 32], "sb125": [28, 32], "sb199": [28, 32], "p7xsfh": 28, "malpractic": [28, 32], "minor": [28, 32], "sb270": [28, 32], "crimin": [28, 32], "offens": [28, 32], "indec": [28, 32], "sb294": [28, 32], "provis": [28, 32], "earli": [28, 32], "childhood": [28, 32], "grade": [28, 32], "twelv": [28, 32], "sb43": [28, 32], "1j95h6q": 28, "adult": [28, 32], "h1069": 28, "1anmcl7": 28, "amp": 28, "revis": 28, "board": 28, "classroom": 28, "princip": 28, "h1521": 28, "restroom": 28, "willfulli": 28, "domest": 28, "complianc": 28, "born": 28, "s0254": 28, "grant": 28, "court": 28, "temporari": 28, "jurisdict": 28, "prescript": 28, "warrant": 28, "custodi": 28, "proceed": 28, "seriou": 28, "expend": 28, "patient": 28, "younger": 28, "immedi": 28, "practition": 28, "arrest": 28, "solicit": 28, "conspir": 28, "s0266": 28, "mission": 28, "plan": 28, "annual": 28, "expenditur": 28, "accredit": 28, "s1382": 28, "defens": 28, "superior": 28, "warfight": 28, "recruit": 28, "retain": 28, "personnel": 28, "sole": 28, "merit": 28, "maintain": 28, "warrior": 28, "etho": 28, "sb140": 28, "entitl": 28, "articl": 28, "regul": 28, "composit": 28, "repeal": 28, "conflict": 28, "ia": 28, "sf482": 28, "multipl": 28, "area": 28, "elementari": 28, "secondari": 28, "formerli": 28, "sf": 28, "335": 28, "sf496": 28, "children": 28, "guardian": 28, "attend": 28, "circumst": 28, "innov": 28, "zone": 28, "kindergarten": 28, "six": 28, "nonpubl": 28, "compet": 28, "ssb": 28, "1145": 28, "sf538": 28, "1197": 28, "conting": 28, "h0071": 28, "s1016": 28, "contractor": 28, "shower": 28, "room": 28, "s1100": 28, "hb1569": 28, "therapi": 28, "payment": 28, "monei": 28, "hb1608": 28, "staff": 28, "vendor": 28, "prekindergarten": 28, "notifi": 28, "unemancip": 28, "sb0480": 28, "knowingli": 28, "less": 28, "aid": 28, "abet": 28, "hb2100": 28, "invest": 28, "esg": 28, "subdivis": 28, "preferenti": 28, "procur": 28, "kper": 28, "fiduciari": 28, "beneficiari": 28, "indemnifi": 28, "adopt": [28, 30], "hb2138": 28, "substitut": [28, 30], "hb": 28, "2138": 28, "overnight": 28, "trip": 28, "broadcast": 28, "administr": 28, "perman": 28, "hb2238": 28, "sb180": 28, "1lgty6a": 28, "statutori": 28, "sb228": 28, "cfam9x": 28, "reimburs": 28, "counti": 28, "cost": 28, "jail": 28, "await": 28, "modern": 28, "statut": 28, "ky": 28, "sb145": 28, "interscholast": 28, "kr": 28, "070": 28, "elig": 28, "nonresid": 28, "manag": [28, 30], "sb150": 28, "notif": 28, "intent": [28, 30], "confidenti": 28, "pupil": 28, "conform": 28, "1415": 28, "la": 28, "hb648": 28, "mo": 28, "hb15": 28, "sb39": 28, "guidelin": 28, "contest": 28, "sb49": 28, "adolesc": 28, "experiment": 28, "hb1125": 28, "reap": 28, "eighteen": 28, "indirect": 28, "furnish": 28, "profession": 28, "emploi": 28, "dure": 28, "taxabl": 28, "premium": 28, "coverag": 28, "incom": 28, "tax": 28, "1972": 28, "medicaid": 28, "insur": 28, "exclud": 28, "medicin": 28, "tort": 28, "immun": 28, "219": 28, "unconstitut": 28, "mt": 28, "hb234": 28, "dissemin": 28, "hb303": 28, "divers": [28, 30], "hb359": 28, "drag": 28, "hb361": 28, "sb458": 28, "sb518": 28, "sb99": 28, "youth": 28, "nc": 28, "h574": 28, "h808": 28, "s49": 28, "nd": 28, "hb1139": 28, "15ear9v": 28, "reenact": 28, "centuri": 28, "hb1205": 28, "hb1249": 28, "co": 28, "hb1254": 28, "penalti": 28, "hb1297": 28, "hb1333": 28, "emption": 28, "hb1473": 28, "locker": 28, "dormitori": 28, "penitentiari": 28, "hb1474": 28, "scrap": 28, "metal": 28, "dealer": 28, "1254": 28, "sixti": 28, "eighth": 28, "1489": 28, "1249": 28, "1139": 28, "hb1489": 28, "hb1522": 28, "hcr3010": 28, "concurr": [28, 30], "vital": 28, "ne": 28, "lb574": 28, "grow": 28, "preborn": 28, "uniform": 28, "credenti": 28, "3109": 28, "054": 28, "3129": 28, "3313": 28, "5319": 28, "3345": 28, "colleg": 28, "ok": 28, "sb26": 28, "noncompli": 28, "sb404": 28, "substanti": 28, "burden": 28, "sb613": 28, "relief": 28, "licensur": 28, "sd": 28, "hb1080": 28, "hb0001": 28, "young": 28, "purport": 28, "inconsist": 28, "tca": 28, "hb0009": 28, "cabaret": 28, "hb0239": 28, "hb0306": 28, "membership": 28, "immut": 28, "hb0727": 28, "hb1269": 28, "teacher": 28, "lea": 28, "insul": 28, "liabil": 28, "sb0001": 28, "sb0003": 28, "sb0466": 28, "sb1237": 28, "sb1440": 28, "sb1443": 28, "sb12": 28, "premis": 28, "sb14": 28, "sb15": 28, "intercollegi": 28, "competit": 28, "sb17": 28, "ut": [28, 30], "hb0209": 28, "extracurricular": 28, "sb0016": 28, "sb0093": 28, "modif": 28, "sb0100": 28, "wi": 28, "sb70": 28, "financ": 28, "constitut": 28, "budget": 28, "fe": 28, "wv": 28, "hb2007": 28, "wy": 28, "sf0133": 28, "rulemak": 28, "hb2312": 28, "hb2786": 28, "sb1001": 28, "sb1026": 28, "moni": 28, "sb1028": 28, "sb1030": 28, "sb1040": 28, "sb1698": 28, "exposur": 28, "revoc": 28, "hb466": 28, "hb81": 28, "sb2231": 28, "discriminatori": 28, "ab465": 28, "441": 28, "448": 28, "1j": 28, "3m": 28, "1m": 28, "beauti": 28, "bill_titl": 28, "migrat": 28, "inforam": 28, "hyperlink": 28, "address": 28, "link_loc": 28, "far": 28, "granular": 28, "class_": [28, 32], "xxx": 28, "hb261sport": 28, "1ftdpv0": 28, "pan": 28, "mous": 28, "window": [28, 29], "highlight": 28, "beacaus": 28, "grap": 28, "bill_card": [28, 32], "partner": 28, "overwhelm": 29, "hypertext": 29, "markup": 29, "layout": 29, "dormous": 29, "stori": 29, "sister": 29, "elsi": 29, "link1": 29, "laci": 29, "link2": 29, "tilli": 29, "link3": 29, "unfamiliar": 29, "oppos": 30, "incorpor": 30, "authent": [30, 33], "queri": [30, 33], "getsearch": 30, "syntaxerror": 30, "invalid": 30, "page_tot": 30, "searchresult": 30, "wait": 30, "sleep": 30, "nest": 30, "concat": 30, "bill_numb": 30, "bill_id": 30, "change_hash": 30, "text_url": 30, "research_url": 30, "last_action_d": 30, "last_act": 30, "hb0316": 30, "1819064": 30, "bb27e8c4d929c9331af7b02dc6d81348": 30, "rul": 30, "inmat": 30, "dc": 30, "b25": 30, "0460": 30, "1778035": 30, "e96fc947b1b4170adf7a3fe91291a61b": 30, "mortal": 30, "cer25": 30, "0143": 30, "1782702": 30, "9aff2f06c9f9b38306f8f3a8e83183c8": 30, "acr25": 30, "0141": 30, "nov": 30, "vt": 30, "jrh004": 30, "1751508": 30, "bfb4a15ca9ece1f262e6ed5759e192ba": 30, "messag": 30, "joint": 30, "hr886": 30, "1784730": 30, "15a2a26d5c91782333a2b37fc8083154": 30, "hb2670": 30, "1757049": 30, "ccfa8fba0550b39bb71af841122e2132": 30, "sensibl": 30, "ac": 30, "mi": 30, "hb4437": 30, "1757146": 30, "604fc33c04c0b4d89cce5b8bd0d51893": 30, "disapprov": 30, "omnibu": 30, "mu": 30, "ny": 30, "s04007": 30, "1690727": 30, "1579358405b6c681a7bd5ed500b7ac14": 30, "chap": 30, "legislatio": 30, "s04004": 30, "1690688": 30, "30e29d6956eec2d3ff19a58c35ad73f8": 30, "BY": 30, "a3004d": 30, "a03004": 30, "1690608": 30, "b862da143af26ca5a2997011fc933673": 30, "thru": 30, "memo": 30, "legiscan_api_result": 30, "extrac": 31, "expert": 31, "workshsop": 31, "among": 31, "find_al": 32, "caption": 32, "attributeerror": 32, "nonetyp": 32, "extens": 32, "pseudo": 32, "descriptoin": 32, "ten": 32, "bunch": 32, "dump": 32, "robust": 32, "legiscan": [32, 33], "legiscan_link": 32, "anchor_tag": 32, "extra": 32, "inst": 32, "2817698": 32, "gove": 32, "2821857": 32, "2756961": 32, "2781770": 32, "2781807": 32, "bill_data": 32, "tab": 32, "acrossn": 32, "crawl": 33, "decid": 33, "invas": 33, "repeatedli": 33, "happi": 33, "archiv": 33, "catalog": 33, "email": 33, "librarian": 33, "weather": 33, "phone": 33, "temperatur": 33, "server": 33, "effici": 33, "nice": 33, "xml": 33, "reddit": 33, "skyscann": 33, "met": 33, "metropolitan": 33, "museum": 33, "art": 33, "endpoint": 33, "folder": 33, "collectionapi": 33, "metmuseum": 33, "directori": 33, "held": 33, "v1": 33, "q": 33, "searchterm": 33, "berth": 33, "morisot": 33, "painter": 33, "438009": 33, "scenario": 33, "rout": 33, "advantag": 33, "framework": 33, "shell": 33, "pagin": 33, "scale": 33, "driver": 33}, "objects": {}, "objtypes": {}, "objnames": {}, "titleterms": {"entiti": [0, 3], "ruler": 0, "1": [0, 2, 5, 32], "write": [0, 2, 5], "down": [0, 2], "code": [0, 2], "pattern": [0, 5], "2": [0, 2, 5, 32], "creat": [0, 2], "our": [0, 8, 11, 28, 32], "add": 0, "3": [0, 2, 32], "run": [0, 2, 5, 15], "nlp": [0, 7], "text": [0, 7, 8, 11, 19, 28], "4": [0, 2], "print": [0, 2, 5], "result": [0, 2], "workshop": [1, 10, 17, 19, 24, 31], "overview": [1, 10, 17, 19, 24, 31], "learn": [1, 10, 16, 17, 24, 31], "object": [1, 2, 3, 9, 10, 17, 24, 26, 28, 31], "googl": [1, 24, 29], "colab": [1, 15, 24, 29], "phrasematch": 2, "phrase": 2, "pass": 2, "your": 2, "spaci": 3, "pipelin": 3, "token": [3, 5], "part": 3, "speech": 3, "depend": 3, "name": [3, 23], "recognit": 3, "ner": 3, "doc": 3, "research": 4, "question": [4, 7], "defin": 4, "gender": 4, "anti": [4, 10, 27, 31], "tran": [4, 10, 27, 31], "legisl": [4, 10, 27, 31], "domain": 4, "specif": 4, "knowledg": 4, "close": 4, "read": 4, "dataset": [4, 14, 15], "matcher": 5, "configur": 5, "match": 5, "what": [7, 9, 27, 28, 33], "analysi": 7, "task": 7, "clean": [8, 9, 12], "inspect": [8, 28], "loop": [8, 22, 23], "through": 8, "replac": 8, "function": [8, 20, 26], "autom": 8, "datafram": [9, 12], "view": 9, "data": [9, 15, 20, 32], "info": 9, "head": 9, "tail": 9, "row": 9, "column": 9, "dropna": 9, "notna": 9, "drop": 9, "scrape": [11, 12, 29, 32, 33], "extract": 11, "bill": [11, 32], "number": 11, "decod": 11, "from": [11, 15, 32], "byte": 11, "string": [11, 23], "import": 12, "librari": [12, 15], "start": 12, "section": 12, "here": 12, "end": [12, 22], "OF": 12, "fine": [13, 16], "tune": [13, 16], "huggingfac": 14, "platform": 14, "model": 14, "hub": 14, "activ": 14, "5": 14, "10": 14, "minut": 14, "infer": 15, "open": [15, 25], "load": 15, "access": 15, "machin": 16, "word": 16, "vector": 16, "king": 16, "man": 16, "woman": 16, "queen": 16, "attent": 16, "mechan": 16, "train": 16, "why": 16, "am": 16, "i": [16, 27], "sai": 16, "all": 16, "thi": 16, "come": 18, "soon": 18, "intro": [19, 29], "python": 19, "work": 19, "seri": 19, "welcom": 19, "upcom": 19, "digit": 19, "scholarship": 19, "sourc": 19, "type": 20, "constraint": 20, "list": 21, "index": 21, "slice": 21, "method": [21, 23, 26], "logic": 22, "boolean": 22, "statement": 22, "condit": 22, "note": [23, 26], "variabl": [23, 26], "environ": 24, "challeng": [25, 28], "vs": [26, 33], "abstract": 26, "ethic": 27, "legal": 27, "everyth": 27, "exhibit": 27, "A": 27, "explor": 28, "bs4": [28, 32, 33], "page": [28, 32], "soup": 28, "get": 28, "attribut": 28, "find": 28, "find_al": 28, "group": 28, "html": 29, "inspector": 29, "legiscan": 30, "api": [30, 33], "step": 32, "isol": 32, "card": 32, "rest": 32, "pick": 32, "out": 32, "inform": 32, "each": 32, "process": 32, "about": 32, "save": 32, "csv": 32, "web": 33, "anatomi": 33, "url": 33, "tool": 33, "beautifulsoup4": 33, "scrapi": 33, "selenium": 33}, "envversion": {"sphinx.domains.c": 2, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 6, "sphinx.domains.index": 1, "sphinx.domains.javascript": 2, "sphinx.domains.math": 2, "sphinx.domains.python": 3, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.intersphinx": 1, "sphinxcontrib.bibtex": 9, "sphinx": 56}})