.dockerignore
.gitattributes
.gitignore
Dockerfile
LICENSE
README.md
approvaltests_config.json
cli
config.yml
pyproject.toml
.github/dependabot.yml
.github/release.yml
.github/workflows/ci.yml
.idea/dataSources.xml
.idea/jsLibraryMappings.xml
.idea/misc.xml
.idea/inspectionProfiles/Project_Default.xml
archive_query_log/__init__.py
archive_query_log/__main__.py
archive_query_log/config.py
archive_query_log/namespaces.py
archive_query_log/orm.py
archive_query_log.egg-info/PKG-INFO
archive_query_log.egg-info/SOURCES.txt
archive_query_log.egg-info/dependency_links.txt
archive_query_log.egg-info/entry_points.txt
archive_query_log.egg-info/requires.txt
archive_query_log.egg-info/top_level.txt
archive_query_log/archives/__init__.py
archive_query_log/captures/__init__.py
archive_query_log/cli/__init__.py
archive_query_log/cli/archives.py
archive_query_log/cli/captures.py
archive_query_log/cli/monitoring.py
archive_query_log/cli/parsers.py
archive_query_log/cli/providers.py
archive_query_log/cli/serps.py
archive_query_log/cli/sources.py
archive_query_log/cli/util.py
archive_query_log/downloaders/__init__.py
archive_query_log/downloaders/warc.py
archive_query_log/imports/__init__.py
archive_query_log/imports/aql22.py
archive_query_log/imports/archive_it.py
archive_query_log/imports/yaml.py
archive_query_log/legacy/__init__.py
archive_query_log/legacy/config.py
archive_query_log/legacy/conftest.py
archive_query_log/legacy/generate_review_sample.py
archive_query_log/legacy/service_stats.py
archive_query_log/legacy/cli/__init__.py
archive_query_log/legacy/cli/alexa.py
archive_query_log/legacy/cli/corpus.py
archive_query_log/legacy/cli/external.py
archive_query_log/legacy/cli/index.py
archive_query_log/legacy/cli/make.py
archive_query_log/legacy/cli/util.py
archive_query_log/legacy/download/__init__.py
archive_query_log/legacy/download/iterable.py
archive_query_log/legacy/download/raw.py
archive_query_log/legacy/download/warc.py
archive_query_log/legacy/index/__init__.py
archive_query_log/legacy/model/__init__.py
archive_query_log/legacy/model/highlight.py
archive_query_log/legacy/model/parse.py
archive_query_log/legacy/queries/__init__.py
archive_query_log/legacy/queries/iterable.py
archive_query_log/legacy/queries/parse.py
archive_query_log/legacy/results/__init__.py
archive_query_log/legacy/results/chatnoir.py
archive_query_log/legacy/results/parse.py
archive_query_log/legacy/results/test/__init__.py
archive_query_log/legacy/results/test/generate_tests.py
archive_query_log/legacy/results/test/test_360_serp_parsing.py
archive_query_log/legacy/results/test/test_aliexpress_serp_parsing.py
archive_query_log/legacy/results/test/test_amazon_serp_parsing.py
archive_query_log/legacy/results/test/test_ask_serp_parsing.py
archive_query_log/legacy/results/test/test_baidu_serp_parsing.py
archive_query_log/legacy/results/test/test_bing_serp_parsing.py
archive_query_log/legacy/results/test/test_bongacams_serp_parsing.py
archive_query_log/legacy/results/test/test_brave_serp_parsing.py
archive_query_log/legacy/results/test/test_canva_serp_parsing.py
archive_query_log/legacy/results/test/test_chefkoch_serp_parsing.py
archive_query_log/legacy/results/test/test_cnn_serp_parsing.py
archive_query_log/legacy/results/test/test_csdn_serp_parsing.py
archive_query_log/legacy/results/test/test_duckduckgo_serp_parsing.py
archive_query_log/legacy/results/test/test_ebay_serp_parsing.py
archive_query_log/legacy/results/test/test_ecosia_serp_parsing.py
archive_query_log/legacy/results/test/test_espn_serp_parsing.py
archive_query_log/legacy/results/test/test_etsy_serp_parsing.py
archive_query_log/legacy/results/test/test_facebook_serp_parsing.py
archive_query_log/legacy/results/test/test_github_serp_parsing.py
archive_query_log/legacy/results/test/test_google_serp_parsing.py
archive_query_log/legacy/results/test/test_imdb_serp_parsing.py
archive_query_log/legacy/results/test/test_imgur_serp_parsing.py
archive_query_log/legacy/results/test/test_indeed_serp_parsing.py
archive_query_log/legacy/results/test/test_jd_serp_parsing.py
archive_query_log/legacy/results/test/test_linkedin_serp_parsing.py
archive_query_log/legacy/results/test/test_manual_google_serp_parsing.py
archive_query_log/legacy/results/test/test_naver_serp_parsing.py
archive_query_log/legacy/results/test/test_pornhub_serp_parsing.py
archive_query_log/legacy/results/test/test_qq_serp_parsing.py
archive_query_log/legacy/results/test/test_qwant_serp_parsing.py
archive_query_log/legacy/results/test/test_reddit_serp_parsing.py
archive_query_log/legacy/results/test/test_roblox_serp_parsing.py
archive_query_log/legacy/results/test/test_sogou_serp_parsing.py
archive_query_log/legacy/results/test/test_stackoverflow_serp_parsing.py
archive_query_log/legacy/results/test/test_tribunnews_serp_parsing.py
archive_query_log/legacy/results/test/test_twitch_serp_parsing.py
archive_query_log/legacy/results/test/test_twitter_serp_parsing.py
archive_query_log/legacy/results/test/test_utils.py
archive_query_log/legacy/results/test/test_vk_serp_parsing.py
archive_query_log/legacy/results/test/test_weibo_serp_parsing.py
archive_query_log/legacy/results/test/test_wikimedia_serp_parsing.py
archive_query_log/legacy/results/test/test_xvideos_serp_parsing.py
archive_query_log/legacy/results/test/test_yahoo_serp_parsing.py
archive_query_log/legacy/results/test/test_yandex_serp_parsing.py
archive_query_log/legacy/results/test/test_youtube_serp_parsing.py
archive_query_log/legacy/serps/__init__.py
archive_query_log/legacy/serps/iterable.py
archive_query_log/legacy/services/__init__.py
archive_query_log/legacy/services/aggregate_services.py
archive_query_log/legacy/services/alexa.py
archive_query_log/legacy/services/search_forms.py
archive_query_log/legacy/services/test_services.py
archive_query_log/legacy/services/update_yaml.py
archive_query_log/legacy/urls/__init__.py
archive_query_log/legacy/urls/fetch.py
archive_query_log/legacy/urls/iterable.py
archive_query_log/legacy/util/__init__.py
archive_query_log/legacy/util/archive_http.py
archive_query_log/legacy/util/html.py
archive_query_log/legacy/util/http_session.py
archive_query_log/legacy/util/iterable.py
archive_query_log/legacy/util/serialization.py
archive_query_log/legacy/util/text.py
archive_query_log/legacy/util/urls.py
archive_query_log/monitoring/__init__.py
archive_query_log/monitoring/home.py
archive_query_log/parsers/__init__.py
archive_query_log/parsers/url.py
archive_query_log/parsers/url_offset.py
archive_query_log/parsers/url_page.py
archive_query_log/parsers/url_query.py
archive_query_log/parsers/util.py
archive_query_log/parsers/warc.py
archive_query_log/parsers/warc_query.py
archive_query_log/parsers/warc_snippets.py
archive_query_log/parsers/xml.py
archive_query_log/providers/__init__.py
archive_query_log/sources/__init__.py
archive_query_log/templates/home.html
archive_query_log/utils/__init__.py
archive_query_log/utils/es.py
archive_query_log/utils/time.py
data/.gitignore
data/selected-services.yaml
data/examples/results.jsonl
data/examples/serps.jsonl
data/manual-annotations/archived-raw-serps/expected/.gitignore
data/manual-annotations/archived-raw-serps/expected/360-21tian-jian-fei-fa-1653652529.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-an-jian-diao-cha-bi-lu-1576497545.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-chen-teng-tan-han-han-mei-ren-jie-ji-1577810108.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-duo-jia-ju-chang-qu-xiao-yan-chu-1579663841.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-hui-ji-pei-xun-1579668897.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-jin-ji-che-hui-1576637402.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-ju-min-jia-zhong-fei-jin-bian-fu-1585788499.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-lu-xing-she-tuan-dui-you-zan-ting-1580014331.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-mao-bu-yi-xiao-chou-chao-xi-1576791478.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-mei-guo-qian-zheng-1579954288.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-niu-jie-5hao-1576819311.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-shi-jie-zui-ai-de-ren-qu-shi-1579483438.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-si-chuan-fa-sheng-6-8ji-di-zhen-1662384982.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-site-chaxun-biz-1550145271.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-site-chaxun-biz-1550161171.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-site-chaxun-biz-1551742698.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-site-eng-kaz-enacademic-com-1581787441.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-tao-bao-ru-he-che-hui-ping-jie-1576604187.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-wu-xiu-bo-yang-kun-ju-hui-hai-ge-1577858222.approved.txt
data/manual-annotations/archived-raw-serps/expected/360-zhang-bo-zhi-bei-gou-yao-shang-1661090641.approved.txt
data/manual-annotations/archived-raw-serps/expected/aliexpress-barefoot-accessories-1508385234.approved.txt
data/manual-annotations/archived-raw-serps/expected/aliexpress-children-school-bag-1388612710.approved.txt
data/manual-annotations/archived-raw-serps/expected/aliexpress-jewelry-sets-1390214039.approved.txt
data/manual-annotations/archived-raw-serps/expected/aliexpress-kids-wear-1293514157.approved.txt
data/manual-annotations/archived-raw-serps/expected/aliexpress-q5-phone-1374387535.approved.txt
data/manual-annotations/archived-raw-serps/expected/aliexpress-sterling-silver-gemstone-1384701071.approved.txt
data/manual-annotations/archived-raw-serps/expected/aliexpress-sterling-silver-pandora-charms-1457090417.approved.txt
data/manual-annotations/archived-raw-serps/expected/aliexpress-transmission-shaft-1435605057.approved.txt
data/manual-annotations/archived-raw-serps/expected/aliexpress-waterproof-winter-boots-women-1500418630.approved.txt
data/manual-annotations/archived-raw-serps/expected/aliexpress-women-messenger-bags-1397198302.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-deng-shi-jia-meng-www-baidu-com-aaaa-oq1-2018nian-8yue-19ri-19shi-32fen-18miao-1564357198.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-dnd-flash-mosquito-1633240377.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-eksa-1662208504.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-gaming-monitor-1639065822.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-guang-huaiba-pawa-me-ta-1632443655.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-guang-huaiba-pawameta-1632443655.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-gym-mat-tile-1634791656.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-joseph-menn-1605789427.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-lovense-1618431049.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-monitor-1625069899.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-notebook-dell-1613232661.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-omega-labyrinth-z-1616510370.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-pillow-fsa-1615964514.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-qian-lian-mo-hua-orizinarusaundotoratsuku-1657685343.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-solefit-1663015835.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-tazas-te-transparente-1613035337.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-the-montells-you-can-t-make-me-1617199271.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-the-risks-of-prescription-drugs-1657820625.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-under-armour-socks-1553107494.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-yangumagazin-yanmagasa-do-1625727694.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-yangumagazin-yanmagasado-1625727694.approved.txt
data/manual-annotations/archived-raw-serps/expected/amazon-zao-dian-jia-meng-pin-pai-www-baidu-com-aaaa-zv9-2018nian-8yue-21ri-17shi-49fen-4miao-1564430721.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-afraid-of-women-1172618037.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-apologist-1172369538.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-are-alkali-metals-lighter-than-water-1619387309.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-batman-movie-1467834503.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-big-tex-trailer-for-sale-1649774735.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-boxer-ear-crop-1173516809.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-caring-1173637789.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-cell-biology-1173639673.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-cure-for-boredom-1174210645.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-date-guy-fawkes-death-1173527460.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-diaframma-contraccezione-lang-it-1175070504.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-dog-ear-design-1172708874.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-fachkunde-metall-fur-ausbildung-in-maschinenbauberufen-1461053109.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-facula-site-www-wordreference-com-1173391757.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-failures-of-president-lincoln-1611567628.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-faither-site-www-accringtonweb-com-1173391901.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-five-phases-of-mitosis-1173539024.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-free-grammer-test-for-employment-1443411312.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-genus-falco-1172718376.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-http-my-notes-on-blogspot-com-1401243816.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-i-ve-site-news-bbc-co-uk-1172693923.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-if-you-break-a-fluorescent-light-bulb-1618021531.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-interior-design-classes-online-1651218822.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-japanese-airlines-1173622069.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-lopsided-site-www-usatoday-com-1173623642.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-meaning-of-integral-site-www-elook-org-1174247342.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-means-mutable-site-www-geek-interview-comrview-com-1173713625.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-means-mutable-site-www-geekinterview-com-1173392177.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-names-of-reggae-artists-1173527903.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-old-fashioned-labels-1172720557.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-olympic-rings-1172716332.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-perfect-first-date-1180217842.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-peter-krogh-photographer-1184320758.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-preparation-of-offal-1172710460.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-radioactivity-in-medicine-1173728275.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-rhino-records-1173555865.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-saiy-phiohom-1525375661.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-scorch-removal-1172719147.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-smirnoff-label-1173377085.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-tie-dye-patterns-1446417858.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-tye-dye-instructions-1446417925.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-vitamins-good-after-expiration-date-expires-site-www-cfs-purdue-edu-1173531858.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-weather-report-for-22903-1489829020.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-week-names-1173639143.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-what-s-california-s-state-bird-1175130217.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-what-should-i-wear-on-the-first-day-of-school-1442349823.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-what-words-rhyme-with-afraid-1173540494.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-whelped-definition-1173526805.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-who-framed-roger-rabbit-1473167643.approved.txt
data/manual-annotations/archived-raw-serps/expected/ask-www-ksu-edu-sa-1182367717.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-e-eeeae-1522165852.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-e-eeeae-1544443888.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-e-eeeae-1547510808.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-e-eeeae-1554431691.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-e-eeeae-1558963051.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-e-eeeae-1567878230.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-e-eeeae-1569971117.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-eru-1525597474.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-lian-xi-qu-dian-nao-pei-xun-1643390077.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-lian-yun-gang-qi-yang-yue-zi-hui-suo-zhong-xin-jing-zhun-ke-hu-ying-xiao-key668-cn-1537259978.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-long-feng-qu-qi-quan-qi-huo-pei-xun-1642853767.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-long-shi-liang-1639014949.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-mao-kui-lu-mao-cong-cong-mao-ning-kui-mao-dan-dan-mang-lu-1549835769.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-mao-kui-lu-mao-cong-cong-mao-ning-kui-mao-dan-dan-mang-lu-1553838201.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-mao-kui-lu-mao-cong-cong-mao-ning-kui-mao-dan-dan-mang-lu-1558979495.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-mao-kui-lu-mao-cong-cong-mao-ning-kui-mao-dan-dan-mang-lu-1564025418.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-mao-ning-kui-mao-dan-dan-mang-long-lou-mang-lu-shikato-1537858258.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-sexinsex-1-2-1213858525.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-shang-hai-11xuan-5ding-dan-wei-xin-weiwei776699-1545685930.approved.txt
data/manual-annotations/archived-raw-serps/expected/baidu-zhong-guo-lian-tong-smsc-1372160086.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-100-9-classic-country-radio-station-alaska-1660338459.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-1137ce-1639788231.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-1968-cougar-on-craigslist-1480218715.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-agent-077-mission-bloody-mary-movie-1593376539.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-aldershot-news-1629564105.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-allovercr-1423275634.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-arab-suck-and-fuck-bouchra-1365405319.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-blockbench-github-1652298697.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-christian-r-ntizimira-1607730426.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-classement-de-la-premier-league-1658725630.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-clay-andrews-1649253287.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-clobetasol-without-prescription-1615178898.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-cody-machan-facebook-1594008363.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-common-use-facilities-1643636012.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-computers-software-presentation-1488623366.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-connecticut-covid-deaths-1628019384.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-corner-app-1618998889.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-countercyclical-fiscal-policy-1643622693.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-crimson-coward-1640789839.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-customer-service-phone-number-for-hp-printer-1662986585.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-dan-robitzski-1660531082.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-dash-investment-foundation-1644415217.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-dataquantum-com-vancouver-hosting-1375879464.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-eero-pro-mesh-wifi-system-1659437763.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-elon-musk-tesla-stock-drop-1656685094.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-european-cannibalism-1591185526.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-explore-with-us-youtube-emma-1651605205.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-florence-caillon-bandcamp-1647897680.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-great-blue-heron-sound-1660552923.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-harukazewakaba0-1643181401.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-herzlich-willkommen-unterbindet-den-storeinfluss-bei-psychosen-1650332555.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-intel-i7-chip-1656625238.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-kumolife-1388896361.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-kutuklui-affair-1643643819.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-lake-wappapello-state-wildlife-area-1643615402.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-libyan-syrian-union-1643642965.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-limbpower-1640025328.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-limited-range-icbm-1643649846.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-mehmet-oz-florida-hunting-license-1657728564.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-mesozoic-wikipedia-1643229373.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-mighty-music-1578065758.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-nexus-mods-manager-1662582175.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-obama-speech-1274497739.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-regional-asia-taiwan-localities-taichung-city-1580952978.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-rpg-title-screen-1656104004.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-shang-chi-film-1563662560.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-sungard-1555022695.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-sweden-riots-1618569435.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-team-liquid-teams-1652030641.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-the-clavarioid-fungi-of-new-zealand-ron-petersen-1556393373.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-uscis-forms-400-1486690408.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-vintage-pittsburgh-steelers-steel-curtain-1497160668.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-wikipedia-orb-univers-de-fiction-1643880033.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-wikipedia-port-de-gennevilliers-metro-de-paris-1604443017.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-wikipedia-privatbrauerei-hoepfner-1620534005.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-wikipedia-rock-macabre-1603539954.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-wikipedia-sider-tribu-1593501017.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-wikipedia-vesuvius-1641311740.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-win10-iso-xia-zai-1580349240.approved.txt
data/manual-annotations/archived-raw-serps/expected/bing-wonder-kids-beginning-1652132287.approved.txt
data/manual-annotations/archived-raw-serps/expected/bongacams-asslicking-1623701105.approved.txt
data/manual-annotations/archived-raw-serps/expected/bongacams-camshow-1653633300.approved.txt
data/manual-annotations/archived-raw-serps/expected/bongacams-cock-sucking-1617355851.approved.txt
data/manual-annotations/archived-raw-serps/expected/bongacams-facial-1578106424.approved.txt
data/manual-annotations/archived-raw-serps/expected/bongacams-fucking-1577494848.approved.txt
data/manual-annotations/archived-raw-serps/expected/bongacams-hd-plus-1576443879.approved.txt
data/manual-annotations/archived-raw-serps/expected/bongacams-massage-1604010948.approved.txt
data/manual-annotations/archived-raw-serps/expected/bongacams-stripping-1623091287.approved.txt
data/manual-annotations/archived-raw-serps/expected/bongacams-stripping-1648087966.approved.txt
data/manual-annotations/archived-raw-serps/expected/bongacams-teasing-1635992326.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-67-degrees-c-static-atmosphere-1665006071.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-a2z-chip-1632000373.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-advanced-search-query-1667410105.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-amoled-1646168352.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-ape-1648509867.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-apple-t3-chip-1651405075.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-avnon-dan-1998-martin-buber-the-hidden-dialogue-lanham-boulder-new-york-oxford-rowman-littlefield-1649576842.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-best-notetaking-app-1654643212.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-bivoks-trebehandling-1654325149.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-chomikuj-1656776694.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-copyq-1665902945.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-cubecraft-skyblock-pig-farm-1664124008.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-dark-brown-mushrooms-that-melt-in-to-the-ground-1657827723.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-fastest-otto-guide-1649849902.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-froggy-pool-1651139840.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-google-play-store-1649985658.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-greentext-1664484724.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-h-m-home-1664916031.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-house-building-cost-estimate-1664320455.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-how-to-archive-mac-notes-1658260525.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-how-tot-ell-if-tail-recurssive-1658814198.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-import-esbuild-from-esbuild-syntaxerror-unexpected-identifier-1652662700.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-indiana-vaccine-passport-ban-1629877535.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-jinniebella-1666397597.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-kymatica-1652976922.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-logitech-1661137612.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-maintenance-1661082520.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-masi-uno-riser-chain-cover-1658006343.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-metaverse-1650224042.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-nair-1666404375.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-new-fold-4-1657628120.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-new-mac-os-release-1664483322.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-nvfbc-1651575025.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-openoffice-1667290210.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-pekara-fontana-niksic-1649235416.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-pizza-box-1662098145.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-product-life-cycle-definition-1664819445.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-random-number-python-1649475875.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-rent-1647905724.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-safemoon-1653585598.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-spigot-1660718390.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-terraform-github-container-1666470147.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-testimonies-project-1653158644.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-tina-daunt-1652776164.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-troll-1649987736.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-unremovable-1650484694.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-usb-3-1-type-c-dp-alt-mode-1667002333.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-utilitx-1659649168.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-video-1649793956.approved.txt
data/manual-annotations/archived-raw-serps/expected/brave-virtualbox-extensions-1667278528.approved.txt
data/manual-annotations/archived-raw-serps/expected/canva-instagram-reels-video-1607594697.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-35-backen-1351851992.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-eier-milch-kse-kartoffeln-1318228714.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-eier-parmesan-spinat-sahne-1206623203.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-eier-spinat-pilze-1200619371.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-eierflaumsuppe-1249321209.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-eierlikr-gugelhupf-1203899612.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-eierlikr-kirschkuchen-1243942587.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-eierlikr-mit-kirsch-1375310772.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-eierlikr-nachspeise-1255758312.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-eierschwammerl-rahmsauce-1449833431.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-eierschwammerl-und-gehacktes-1315110709.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-eifreier-hackbraten-1356156512.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-hhnchen-warme-1303285108.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-kirsch-1305195838.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-kohlroulade-gemse-1328779105.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-kseschnitzel-kse-1353053392.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-nudelsalat-mit-ei-1330099391.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-omas-blechkuchen-1355822404.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-roulade-braten-1355445937.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-sahne-und-himbeeren-1192658021.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-spaghetti-eis-torte-1342866905.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-spaghetti-hhnchen-1192740442.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-spaghetti-mit-gemsesauce-1190132272.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-spaghettie-mit-garnelen-1206750318.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-spaghettitorte-vom-blech-1369060560.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-spaghettoni-1206569039.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-spanische-salat-1192556276.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-spargel-geschlt-1278411144.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-spargel-m-soe-1280861753.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-spargel-risotto-mit-garnelen-1471699836.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-spargel-wei-1194284442.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-speck-n-dicken-1370169101.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-speck-zucchini-eier-sahne-1222747904.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-speckbohnen-mit-kartoffeln-1352170361.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-speisestrke-sahne-1232351646.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-spinat-in-1220295440.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-streuselkuchen-aus-mrbeteig-1299585024.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-suppen-oder-eintpfe-1256106491.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-sushi-mit-normalem-reis-1470947014.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-syrische-pasta-1466000049.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-tabouleh-rosinen-1382360347.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-tatar-steak-1266004316.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-tempura-1213419780.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-thai-curry-1246123954.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-thai-curry-einfach-1420408232.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-thailndisch-1313401080.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-thermomix-gefllten-1390802313.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-tomaten-mozarella-reis-1317162887.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-tupperware-hefe-1356254719.approved.txt
data/manual-annotations/archived-raw-serps/expected/chefkoch-walnussl-dressing-1403236002.approved.txt
data/manual-annotations/archived-raw-serps/expected/cnn-achievable-possibility-1642416655.approved.txt
data/manual-annotations/archived-raw-serps/expected/cnn-apple-watch-2016-1662575890.approved.txt
data/manual-annotations/archived-raw-serps/expected/cnn-biteukoinsaryeomyeon-www-99m-kr-bei-biteukoinsaryelie-biteukoinsaeobbbiteukoinsaeobjadeungrog-biteuk-1647153716.approved.txt
data/manual-annotations/archived-raw-serps/expected/cnn-biteukoinsaryeomyeon-www-99m-kr-bei-biteukoinsaryelie-biteukoinsaeobbbiteukoinsaeobjadeungrog-biteukoinsayongbangbeob8reduplicate-1647153716.approved.txt
data/manual-annotations/archived-raw-serps/expected/cnn-dxa-1634498874.approved.txt
data/manual-annotations/archived-raw-serps/expected/cnn-kindly-check-1642508434.approved.txt
data/manual-annotations/archived-raw-serps/expected/cnn-march-4-1633908556.approved.txt
data/manual-annotations/archived-raw-serps/expected/cnn-north-dakota-coronavirus-1632793271.approved.txt
data/manual-annotations/archived-raw-serps/expected/cnn-skilled-1643388398.approved.txt
data/manual-annotations/archived-raw-serps/expected/cnn-trigger-1638271567.approved.txt
data/manual-annotations/archived-raw-serps/expected/cnn-wright-1616229078.approved.txt
data/manual-annotations/archived-raw-serps/expected/csdn-android-studio-1660487187.approved.txt
data/manual-annotations/archived-raw-serps/expected/csdn-fifo-1663204137.approved.txt
data/manual-annotations/archived-raw-serps/expected/csdn-rows-1665572662.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-145-lbs-to-kg-1664351690.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-150-degrees-to-radians-site-degreestoradians-net-1662073498.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-2-5-muiles-to-km-1648676868.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-2022-07-12-23-00-site-www-time-time-net-1657640396.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-25-c-to-f-site-www-metric-conversions-org-1655636638.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-32168-weather-radar-1667504070.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-3rd-party-twitch-chat-1642095474.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-40-mile-creek-trail-site-www-arizonahighways-com-1657173375.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-branch-conventions-git-site-social-msdn-microsoft-com-1664392383.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-breaking-news-on-sierra-leone-1663541702.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-broken-reality-steam-site-www-huntmar-com-1597289631.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-buck-showalter-seinfeld-1654420295.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-build-chest-freezer-site-www-quora-com-1654893310.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-bulk-copper-pennies-for-sale-1646606334.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-burnout-paradise-online-multiplayer-with-all-dlc-site-www-counton-org-1655566858.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-c-pretty-print-json-1662310061.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-elite-dangerous-covas-site-www-pcgamer-com-1653704722.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-elite-dangerous-site-www-thegamer-com-1658908937.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-elton-john-site-www-esquire-com-1657307467.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-emoji-pedia-site-www-youtube-com-1590838578.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-empure-site-empure-in-1664600213.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-encountered-conflicts-when-cherry-picking-commit-1618189582.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-enneagram-test-site-www-crystalknows-com-1638683347.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-equation-of-dissociation-of-sulfuric-acid-site-www-sciencedirect-com-1649296927.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-erik-erikson-s-theory-site-positivepsychology-com-1654620203.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-gimp-use-align-tool-site-thegimptutorials-com-1653712700.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-jeanne-d-arc-site-id-wikipedia-org-1655183773.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-llanelly-carmarthenshire-wales-1655261859.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-newest-call-of-duty-game-1653477001.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-quit-telnet-site-www-codegrepper-com-1665105234.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-sheer-skirt-beach-thing-site-www-lyst-com-1653921398.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-sheets-site-www-kohls-com-1642928572.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-sheydim-site-www-sefaria-org-1664233097.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-simplify-subtraction-of-fractals-site-www-thecalculator-co-1637459222.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-sims-castaway-trailer-1647012563.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-u-team-1636548723.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-ubuntu-mesa-intel-r-hd-graphics-620-kbl-gt2-site-forum-unity-com-1658976095.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-ubuntu-netplan-package-site-www-ubuntuupdates-org-1665115336.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-ukraine-site-www-cfr-org-1646796603.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-united-reformed-churches-in-north-america-1446324275.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-universal-logs-checker-1-1-0-site-cracking-org-1656559962.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-update-admx-files-on-domain-controller-1660061931.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-waldo-s-chicken-site-waldoschicken-com-1654372116.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-warren-hunt-1635806147.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-waterford-house-erfstadt-court-wokingham-berkshire-rg40-2yf-google-maps-1660892879.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-we-acknowledge-the-traditional-custodians-of-the-land-on-which-our-office-stands-the-wurundjeri-peop-1654920640.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-webassembly-browser-support-list-1653198525.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-website-sitemap-finder-site-seositecheckup-com-1614287233.approved.txt
data/manual-annotations/archived-raw-serps/expected/duckduckgo-what-happened-to-greta-thornburg-1667535932.approved.txt
data/manual-annotations/archived-raw-serps/expected/ebay-1-4-1566151598.approved.txt
data/manual-annotations/archived-raw-serps/expected/ebay-hu-bei-kuai-san-zhong-jiang-zhu-shou-jia-wei-vxin-weiwei776699-1548361753.approved.txt
data/manual-annotations/archived-raw-serps/expected/ebay-imaginext-batman-motorcycle-1597143554.approved.txt
data/manual-annotations/archived-raw-serps/expected/ebay-liu-he-cai-2o2526-wei-xin-weiwei776699-1562672411.approved.txt
data/manual-annotations/archived-raw-serps/expected/ebay-liu-he-cai-gua-pai-wan-zheng-ban-wei-vxin-weiwei776699-1565563054.approved.txt
data/manual-annotations/archived-raw-serps/expected/ebay-se-xing-mei-jia-wei-vxin-dun35358-1544323503.approved.txt
data/manual-annotations/archived-raw-serps/expected/ebay-shan-dong-11xuan-5-360cai-piao-wei-xin-weiwei776699-1538125942.approved.txt
data/manual-annotations/archived-raw-serps/expected/ebay-smartphones-1334931269.approved.txt
data/manual-annotations/archived-raw-serps/expected/ebay-srch-str-1641320481.approved.txt
data/manual-annotations/archived-raw-serps/expected/ebay-victoria-s-secret-1559541146.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-8-ft-to-cm-1629639998.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-average-amount-of-photos-you-could-take-on-a-camera-in-1940-s-1572660962.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-barnes-1636235793.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-by-talos-this-cant-be-happening-1630519906.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-can-you-show-smoking-on-tv-1624555764.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-coding-freelancing-1634534706.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-correct-way-to-wash-hair-oily-scalp-1588676008.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-dall-e-1654952788.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-deaf-community-1626760345.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-financial-risk-tolerance-quiz-1643759873.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-foot-to-centimeter-1612629786.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-form-1694-instructions-1635977208.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-free-file-sharing-services-1638926359.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-fudanshi-1655238275.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-game-changer-classic-1638948940.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-git-create-pull-request-1655702772.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-gmail-sign-in-1637276050.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-gnome-desktop-entry-1655209403.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-google-image-scraper-1601781718.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-grady-white-ce-251-1636884788.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-h-and-m-clothing-sale-1635863133.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-hallam-f-c-1596174558.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-harry-styles-siblings-1634695267.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-health-conditions-and-diseases-neurological-disorders-meningitis-1666663445.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-high-functioning-depression-23w-1615448305.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-hisotry-of-tomato-in-india-23yt-1591696836.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-hm-219c-1637494750.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-how-much-doordash-driver-make-1654857157.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-how-to-be-more-generous-1590871266.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-how-to-check-if-a-value-is-null-in-c-1639813391.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-laughter-stories-1640836502.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-macglauglin-1640487447.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-percy-jackson-s-greek-gods-1634509308.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-saltpeter-beds-1643653808.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-sin-is-an-ugly-creature-1590737798.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-vasectomy-reversal-success-rate-23yt-1623229800.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-virtual-studio-code-download-for-windows-10-1642714491.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-watch-tv-series-23g-1602851877.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-we-will-rock-you-23yt-1587407460.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-west-point-nebraska-1644663254.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-what-does-god-do-to-tratorirs-1590883066.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-what-is-a-description-1655190914.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-what-s-the-shortest-war-ever-1635275630.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-where-are-my-chrome-extensions-1635276242.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-whiteman-afb-public-affairs-1636203076.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-why-can-t-you-order-international-nail-polish-online-india-23a-1586448930.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-windows-11-activator-reddit-1637172885.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-windows-for-workgroups-3-11-iso-1644191359.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-world-deutsch-regional-europa-deutschland-baden-wurttemberg-stadte-und-gemeinden-karlsruhe-1621530240.approved.txt
data/manual-annotations/archived-raw-serps/expected/ecosia-world-deutsch-regional-europa-deutschland-hessen-landkreise-rheingau-taunus-kreis-stadte-und-gemeind-1595135090.approved.txt
data/manual-annotations/archived-raw-serps/expected/espn-ball-state-1615730301.approved.txt
data/manual-annotations/archived-raw-serps/expected/espn-ball-state-1619440827.approved.txt
data/manual-annotations/archived-raw-serps/expected/etsy-andrew-kim-1566153959.approved.txt
data/manual-annotations/archived-raw-serps/expected/etsy-embroidery-kit-1375805089.approved.txt
data/manual-annotations/archived-raw-serps/expected/etsy-hard-plastic-1333819223.approved.txt
data/manual-annotations/archived-raw-serps/expected/etsy-invitation-1367234841.approved.txt
data/manual-annotations/archived-raw-serps/expected/etsy-pacifier-1336437253.approved.txt
data/manual-annotations/archived-raw-serps/expected/etsy-pendants-1667648711.approved.txt
data/manual-annotations/archived-raw-serps/expected/etsy-small-animal-1378528595.approved.txt
data/manual-annotations/archived-raw-serps/expected/etsy-storage-and-organization-1632881953.approved.txt
data/manual-annotations/archived-raw-serps/expected/etsy-sundress-1374472455.approved.txt
data/manual-annotations/archived-raw-serps/expected/etsy-yan-dong-kuai-le-shi-fen-shou-ji-ban-jia-wei-xin-xw639-2018-1537911471.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-1-million-cards-1614844146.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-3dnoam-chomsky-1611582471.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-3dtaylor-company-1611665585.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-5-orszagos-1618089409.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-7-1620274873.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-abbvie-1623327630.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-aj-duca-1388091562.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-alda-lesbiennes-refugiees-1615284371.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-anthony-1376743219.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-bernieorbust-1467812085.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-blog-post-319-je31-1567459151.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-blog-post-334-bootload-1567494170.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-cruzcrew-1459272010.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-deanna-sanchez-1629215596.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-greet-1623235952.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-https-peelarchivesblog-com-about-peel-1599241783.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-ineligible-1466870871.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-jam-of-the-day-1410919861.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-mens-health-survival-of-the-fittest-1619473718.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-mr-robot-1469187052.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-rosy-20gupta-1494524363.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-social-plugins-boutons-jaime-envoyer-partager-et-citations-js-exec-je31-1567485463.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-solcellespecialisten-1389488036.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-tag-someone-who-needs-this-1587554575.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-trumptrain-1461904486.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-vanilla-1481832838.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-victoria-pynchon-1294673180.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-virpi-soikkeli-1623257178.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-wisconsin-1463064570.approved.txt
data/manual-annotations/archived-raw-serps/expected/facebook-www-9xcb-biz-webex-setup-was-unsuccessful-error-23-1404412853.approved.txt
data/manual-annotations/archived-raw-serps/expected/github-jie-shi-de-jing-mi-gong-ye-you-xian-gong-si-1597737683.approved.txt
data/manual-annotations/archived-raw-serps/expected/github-licensing-gethhwid-1662581846.approved.txt
data/manual-annotations/archived-raw-serps/expected/github-mastodon-1657854340.approved.txt
data/manual-annotations/archived-raw-serps/expected/github-org-zettlr-1591675518.approved.txt
data/manual-annotations/archived-raw-serps/expected/github-subrock-1653099784.approved.txt
data/manual-annotations/archived-raw-serps/expected/github-topic-bootswatch-org-sslcom-1552777180.approved.txt
data/manual-annotations/archived-raw-serps/expected/github-topic-deprecated-org-bandwidth-fork-true-1634361552.approved.txt
data/manual-annotations/archived-raw-serps/expected/github-topic-docker-stack-org-issuu-1549097482.approved.txt
data/manual-annotations/archived-raw-serps/expected/github-topic-id-org-codercom-1553274306.approved.txt
data/manual-annotations/archived-raw-serps/expected/github-topic-web-components-org-github-fork-true-1650012538.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-243-1628713922.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-9-11-revisited-1618106149.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-agust-1614235489.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-atalanta-bergamasca-calcio-wikipedia-1643703998.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-attack-on-titan-season-3-part-2-1556408967.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-bill-easley-sophisticated-prelude-1626498182.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-boulevard-records-canada-site-wikipedia-org-site-wikimedia-org-1510135498.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-bouncing-hero-switch-site-easyallies-com-1633303267.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-bozsa-bence-site-hu-wikipedia-org-1647787452.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-can-ju-ying-yu-1560296360.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-chi-zhen-nzhong-rong-keteru-1608917828.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-compress-tube-wikipedia-1644670761.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-coneybury-anomaly-wikipedia-1640176109.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-conflict-middle-east-wikipedia-1636797028.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-continental-automotive-systems-wikipedia-1651015350.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-cortisol-test-1623205666.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-coxsackie-virus-1617107799.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-crow-names-1608438374.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-dead-cock-mortuary-1614203203.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-diffusion-systems-for-evaluation-of-biomineralization-1618448715.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-does-steve-has-a-beard-1601705030.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-dove-soap-1617107771.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-evan-colborne-1647984326.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-facebuster-1650197554.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-fatmira-brecani-1662136538.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-fer-palacio-1631069534.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-film-review-annual-1660769248.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-finance-1540158323.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-flop-thumbs-up-1568839345.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-focusrite-1641240556.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-forced-labor-in-california-1635373615.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-front-polisario-khat-al-shahid-1652852892.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-future-planning-1648480487.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-george-w-summers-1637786317.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-giulia-botti-1660836463.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-gnosticism-1615175612.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-grasshopper-design-pvt-ltd-1640249780.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-green-capital-energy-site-wikipedia-org-site-wikimedia-org-1657756151.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-green-wave-106-5-fm-1637281540.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-guntury-1650179158.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-hawaii-part-ii-lyrics-1633318830.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-hola-games-1552338270.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-homemade-l-1617107839.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-kolex-1645947964.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-kostiantyn-magaletskyi-1638351261.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-kothuru-assembly-constituency-1631384737.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-kurabayashi-1643815267.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-kush-raval-indian-cricketer-site-wikipedia-org-site-wikimedia-org-1649726560.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-la-pipa-1635023533.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-lars-brygmann-1633135602.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-laxmikant-pyarelal-1657295550.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-lenin-1614385592.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-leo-de-la-strehaia-1633884656.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-lige-gardner-1637042221.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-list-of-cantons-of-france-1634951028.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-list-of-crossings-of-the-james-river-1662064377.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-list-of-grand-dukes-of-russia-1645733808.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-list-of-surviving-lockheed-f-104-starfighters-1662745731.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-lope-recio-loynaz-1658853508.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-lucas-ruzin-1658326494.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-lucius-vibullius-rufus-son-in-law-of-herodes-atticus-1642439444.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-luiz-carlos-footballer-born-1980-wikipedia-1637131910.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-lycee-francais-louis-pasteur-de-lagos-1638831028.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-modern-times-chaplin-watch-online-1662343522.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-now-it-s-time-for-your-treatment-relax-make-yourself-comfortable-1427746605.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-ocolc-826746-1240020639.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-orlando-bedoya-site-wikipedia-org-site-wikimedia-org-1629326434.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-pareques-site-hu-wikipedia-org-1647941362.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-sarah-monfort-wikipedia-1647374906.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-scholar-a-tumeo-m-branca-l-camerini-a-dual-priority-realtime-multiprocessor-system-on-fpga-for-automotive-ap-1614181186.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-scholar-muhammed-rashid-1656890873.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-scholar-w-fan-j-li-s-ma-n-tang-and-w-yu-april-2012-towards-certain-fixes-with-editing-rules-and-master-data-1614165399.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-scholar-wan-y-menon-s-and-ramaprasad-a-2009-the-paradoxical-nature-of-electronic-decision-aids-on-comparison-1614187144.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-susan-boyle-make-me-a-channel-of-your-peace-1607791072.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-taikoo-hui-mandarin-oriental-hotel-guangzhou-1652086766.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-why-is-one-foot-slightly-larger-than-the-other-one-1605140430.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-win10-iso-xia-zai-1577717811.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-www-boston-hotels-cheap-net-1062123561.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-www-exactresult-com-1062373767.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-www-wallstquotes-com-1062140693.approved.txt
data/manual-annotations/archived-raw-serps/expected/google-zombie-apocalypse-1565114134.approved.txt
data/manual-annotations/archived-raw-serps/expected/imdb-0609265-s-nm-1329020836.approved.txt
data/manual-annotations/archived-raw-serps/expected/imdb-angelina-jolie-1452700725.approved.txt
data/manual-annotations/archived-raw-serps/expected/imdb-dogville-1187303706.approved.txt
data/manual-annotations/archived-raw-serps/expected/imdb-gundula-rapsch-1628094679.approved.txt
data/manual-annotations/archived-raw-serps/expected/imdb-hunger-games-1518585690.approved.txt
data/manual-annotations/archived-raw-serps/expected/imdb-marcela-gomez-montoya-1614546944.approved.txt
data/manual-annotations/archived-raw-serps/expected/imdb-murder-world-1268209692.approved.txt
data/manual-annotations/archived-raw-serps/expected/imdb-pulse-1283006912.approved.txt
data/manual-annotations/archived-raw-serps/expected/imdb-sam-claflin-1472223834.approved.txt
data/manual-annotations/archived-raw-serps/expected/imdb-the-expanse-1521743964.approved.txt
data/manual-annotations/archived-raw-serps/expected/imgur-search-term-string-1547858079.approved.txt
data/manual-annotations/archived-raw-serps/expected/imgur-search-term-string-1565643838.approved.txt
data/manual-annotations/archived-raw-serps/expected/indeed-60000-1450529560.approved.txt
data/manual-annotations/archived-raw-serps/expected/indeed-concept-development-integration-1647187061.approved.txt
data/manual-annotations/archived-raw-serps/expected/indeed-customer-service-1447983624.approved.txt
data/manual-annotations/archived-raw-serps/expected/indeed-hca-corporate-1334425152.approved.txt
data/manual-annotations/archived-raw-serps/expected/indeed-higher-education-freelance-network-1585036169.approved.txt
data/manual-annotations/archived-raw-serps/expected/indeed-international-english-prep-academy-iepa-1586237411.approved.txt
data/manual-annotations/archived-raw-serps/expected/indeed-jvm-lending-1586272513.approved.txt
data/manual-annotations/archived-raw-serps/expected/indeed-origins-macy-s-1353165507.approved.txt
data/manual-annotations/archived-raw-serps/expected/indeed-pepsico-1487893385.approved.txt
data/manual-annotations/archived-raw-serps/expected/indeed-steiner-business-solutions-1577184429.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-1368578723.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-ch-1382528052.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-che-zai-cd-1507664971.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-dao-tian-1442736754.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-guan-yin-liao-1501752634.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-iu-vdun35358z-1537907650.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-ji-guang-da-yin-1516054404.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-mo-yan-1516163665.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-qing-shang-1510505248.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-sha-tan-ku-nan-1446537277.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-shlrwanh-uq-2179706936-1473350033.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-song-yan-1434320372.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-tai-kong-zhen-1508948206.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-tuan-dui-guan-li-1429813603.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-weiwei776699e-1537978473.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-xian-xing-dai-shu-1497236213.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-yang-hong-wei-1429640037.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-you-xi-1511265243.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-yu-diao-jiu-ning-meng-1601078153.approved.txt
data/manual-annotations/archived-raw-serps/expected/jd-yxingaiujliu-xwcp198-1537926187.approved.txt
data/manual-annotations/archived-raw-serps/expected/linkedin-cryptocurrencies-1556702372.approved.txt
data/manual-annotations/archived-raw-serps/expected/linkedin-g-d-goenka-international-school-surat-wisdom-valley-campus-nr-anuvrat-dwar-new-city-light-road-rcc-c-1568400864.approved.txt
data/manual-annotations/archived-raw-serps/expected/linkedin-g-d-goenka-international-school-surat-wisdom-valley-campus-nr-anuvrat-dwar-new-city-light-road-rcc-canal-road-bar-surat-gujrat-1568400864.approved.txt
data/manual-annotations/archived-raw-serps/expected/linkedin-james-margolin-fbi-1571382052.approved.txt
data/manual-annotations/archived-raw-serps/expected/linkedin-parent-information-center-of-nj-https-www-linkedin-com-feed-1537815970.approved.txt
data/manual-annotations/archived-raw-serps/expected/linkedin-parent-information-center-of-nj-https-www-linkedin-com-search-results-all-keywords-parent-informatio-1537815969.approved.txt
data/manual-annotations/archived-raw-serps/expected/linkedin-parent-information-center-of-nj-https-www-linkedin-com-search-results-all-keywords-parent-information-center-of-nj-1537815969.approved.txt
data/manual-annotations/archived-raw-serps/expected/linkedin-test-1563279735.approved.txt
data/manual-annotations/archived-raw-serps/expected/linkedin-vizthink-1229875736.approved.txt
data/manual-annotations/archived-raw-serps/expected/naver-10559239-974530320.approved.txt
data/manual-annotations/archived-raw-serps/expected/naver-11548566-973003263.approved.txt
data/manual-annotations/archived-raw-serps/expected/naver-dpsxmfl-1632292908.approved.txt
data/manual-annotations/archived-raw-serps/expected/naver-geobugseon-1439284748.approved.txt
data/manual-annotations/archived-raw-serps/expected/naver-heolkeu-dari-gajin-namja-1397449417.approved.txt
data/manual-annotations/archived-raw-serps/expected/naver-junggangosagongbu-1627424756.approved.txt
data/manual-annotations/archived-raw-serps/expected/naver-monteria-montheria-bunyupoteu-jeongitipoteu-jeongijujeonja-bunyupoteugi-1200ml-1200mlpingkeu-hugi-1640713881.approved.txt
data/manual-annotations/archived-raw-serps/expected/naver-sejongmunhwahoegwan-daegeugjang-1652993423.approved.txt
data/manual-annotations/archived-raw-serps/expected/naver-t-1047137339.approved.txt
data/manual-annotations/archived-raw-serps/expected/naver-z-974687640.approved.txt
data/manual-annotations/archived-raw-serps/expected/pornhub-12-1565436858.approved.txt
data/manual-annotations/archived-raw-serps/expected/pornhub-brazilian-carnival-1378864891.approved.txt
data/manual-annotations/archived-raw-serps/expected/pornhub-cfnm2-1271707129.approved.txt
data/manual-annotations/archived-raw-serps/expected/pornhub-full-porno-films-1633148146.approved.txt
data/manual-annotations/archived-raw-serps/expected/pornhub-kardashian-1232246712.approved.txt
data/manual-annotations/archived-raw-serps/expected/pornhub-mini-skirt-1257166127.approved.txt
data/manual-annotations/archived-raw-serps/expected/pornhub-org-1219567054.approved.txt
data/manual-annotations/archived-raw-serps/expected/pornhub-roxy-reynolds-1222496976.approved.txt
data/manual-annotations/archived-raw-serps/expected/pornhub-stripping-1627962626.approved.txt
data/manual-annotations/archived-raw-serps/expected/pornhub-teen-facial-1237526884.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-danil-kozlovsky-1360453772.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-erin-1359911760.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-feng-mi-lian-1380895166.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-hua-ze-xiang-cai-1408309927.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-james-boshier-1449178049.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-ji-lin-yan-ji-1360789033.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-ji-zhou-dao-ttglao-hu-ji-ping-tai-guan-wang-x-fa33n-comx-1488991663.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-jie-ke-luo-de-wei-er-1445892389.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-jin-cheng-wu-1319745059.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-jin-xiu-long-1320298924.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-lin-xi-tong-1507483207.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-niamh-cusack-1319751306.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-shen-shan-zheng-er-lang-1405119212.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-statue-1536122094.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-tag-encode-1341871817.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-turn-that-finger-around-1324266860.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-xing-xing-di-qiu-2-1582812539.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-zhang-dong-jian-1446133153.approved.txt
data/manual-annotations/archived-raw-serps/expected/qq-zhong-nian-wei-ji-1408289827.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-administrateur-general-du-cnam-1619206522.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-allades-1631959376.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-anna-sottilotta-1630417705.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-another-word-for-less-likely-1641721403.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-attaque-a-tunis-1433356632.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-bluestacks-keyboard-not-working-1637463746.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-celine-de-roany-1640557696.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-code-9-1661507082.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-danse-1460250714.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-david-shepard-restaurateur-de-film-1595246740.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-dr-heim-tampa-1631748962.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-dr-michael-valliere-1653406352.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-drapeau-canadien-1615473541.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-eric-singer-drums-1621083357.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-festival-corazon-latino-1644332358.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-fredrik-lundberg-1665847606.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-geographie-de-la-france-1620931197.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-great-falls-gun-club-1637348184.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-guerre-froide-1654846351.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-hovelhof-1461470750.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-i-squared-capital-linkedin-1653657436.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-initialiser-debat-dadmissibilite-1645273237.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-jesus-mendez-facebook-1642962807.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-journee-nationale-du-drapeau-gabonais-1628405454.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-lemke-software-gmbh-1625227146.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-lombocruralgie-francais-1656441384.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-marcel-caya-1628794563.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-metal-slug-foo-1624572900.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-musique-folklorique-bretonne-1631820741.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-neonazis-en-france-1663085614.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-obs-keyframe-interval-1657322209.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-ouat-once-upon-a-train-1643380520.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-phantasialand-1461344566.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-que-tal-magazine-1643474954.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-rmvmn-1619293679.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-rob-diamond-movies-1626693763.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-rosa-linux-1664389965.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-sacred-age-odysseria-1652523638.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-skerdi-dervishaj-1635917093.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-sporting-stadium-1640362241.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-steam-ubuntu-wiki-1592725715.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-the-owl-club-1666374443.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-toddlercon-1579361594.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-trouve-arc-bf4-1625314405.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-tv-horror-movies-chart-1667140806.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-unification-album-1626264528.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-victoria-zdrok-1632510384.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-volt-bulgarie-1628499772.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-what-is-beowulf-about-summary-1659304409.approved.txt
data/manual-annotations/archived-raw-serps/expected/qwant-world-deutsch-regional-europa-deutschland-baden-wurttemberg-landkreise-heilbronn-stadte-und-gemeinde-1626329085.approved.txt
data/manual-annotations/archived-raw-serps/expected/reddit-3ds-1364668924.approved.txt
data/manual-annotations/archived-raw-serps/expected/reddit-b7-1650853917.approved.txt
data/manual-annotations/archived-raw-serps/expected/reddit-flair-already-posted-https-redd-it-xamfzl-1667030236.approved.txt
data/manual-annotations/archived-raw-serps/expected/reddit-german-nebelmittelwurfanlage-1664557458.approved.txt
data/manual-annotations/archived-raw-serps/expected/reddit-how-can-i-access-nature-com-articles-1666041985.approved.txt
data/manual-annotations/archived-raw-serps/expected/reddit-jailbait-1376244913.approved.txt
data/manual-annotations/archived-raw-serps/expected/reddit-supermoon-1403887175.approved.txt
data/manual-annotations/archived-raw-serps/expected/reddit-teleperformance-1260472045.approved.txt
data/manual-annotations/archived-raw-serps/expected/reddit-touch-meme-1663170731.approved.txt
data/manual-annotations/archived-raw-serps/expected/reddit-typetest-10fastfingers-1663797626.approved.txt
data/manual-annotations/archived-raw-serps/expected/roblox-build-to-survive-black-people-1663785067.approved.txt
data/manual-annotations/archived-raw-serps/expected/roblox-chernobyl-rp-1666555966.approved.txt
data/manual-annotations/archived-raw-serps/expected/roblox-cut-1633682743.approved.txt
data/manual-annotations/archived-raw-serps/expected/roblox-shorts-1357668619.approved.txt
data/manual-annotations/archived-raw-serps/expected/roblox-soviet-union-1657601847.approved.txt
data/manual-annotations/archived-raw-serps/expected/roblox-survival-1656759229.approved.txt
data/manual-annotations/archived-raw-serps/expected/roblox-survive-the-killer-1640549700.approved.txt
data/manual-annotations/archived-raw-serps/expected/roblox-welcome-to-the-town-of-robloxia-uncopylocked-1660007534.approved.txt
data/manual-annotations/archived-raw-serps/expected/roblox-xo-so-88-gg8-run-1659417607.approved.txt
data/manual-annotations/archived-raw-serps/expected/roblox-znation8000-1650350926.approved.txt
data/manual-annotations/archived-raw-serps/expected/sogou-cesuk-163163163-cn-1493482889.approved.txt
data/manual-annotations/archived-raw-serps/expected/sogou-eed-1-4a1-a-1332923188.approved.txt
data/manual-annotations/archived-raw-serps/expected/sogou-j-1341637724.approved.txt
data/manual-annotations/archived-raw-serps/expected/sogou-ju-min-shen-fen-zheng-hao-ma-he-xing-ming-1508756794.approved.txt
data/manual-annotations/archived-raw-serps/expected/sogou-l-1346233371.approved.txt
data/manual-annotations/archived-raw-serps/expected/sogou-lofke-yi-kua-shi-chang-mai-mai-1333092705.approved.txt
data/manual-annotations/archived-raw-serps/expected/sogou-ti-gong-jin-kou-qi-qiang-1647324224.approved.txt
data/manual-annotations/archived-raw-serps/expected/sogou-tu-guan-xin-gai-kuan-1332227339.approved.txt
data/manual-annotations/archived-raw-serps/expected/sogou-xing-ai-ji-qiao-1576522689.approved.txt
data/manual-annotations/archived-raw-serps/expected/sogou-yuan-dai-ma-xie-lu-1578201651.approved.txt
data/manual-annotations/archived-raw-serps/expected/stackoverflow-fonts-swing-jtextpane-1412916125.approved.txt
data/manual-annotations/archived-raw-serps/expected/stackoverflow-numpy-einsum-1516773912.approved.txt
data/manual-annotations/archived-raw-serps/expected/stackoverflow-objective-c-1354546520.approved.txt
data/manual-annotations/archived-raw-serps/expected/stackoverflow-remote-execution-1645839151.approved.txt
data/manual-annotations/archived-raw-serps/expected/stackoverflow-ruby-1-9-3-heroku-1398351399.approved.txt
data/manual-annotations/archived-raw-serps/expected/stackoverflow-ruby-on-rails-plugins-1613971498.approved.txt
data/manual-annotations/archived-raw-serps/expected/stackoverflow-scala-1355718931.approved.txt
data/manual-annotations/archived-raw-serps/expected/stackoverflow-text-mining-1522322354.approved.txt
data/manual-annotations/archived-raw-serps/expected/stackoverflow-vue-js-php-1647710017.approved.txt
data/manual-annotations/archived-raw-serps/expected/stackoverflow-xampp-java-1547581001.approved.txt
data/manual-annotations/archived-raw-serps/expected/tribunnews-linkid-js-1533168227.approved.txt
data/manual-annotations/archived-raw-serps/expected/tribunnews-peringatan-dini-bmkg-kamis-18-februari-2021-1632679908.approved.txt
data/manual-annotations/archived-raw-serps/expected/tribunnews-pilgub-dki-jakarta-2017-1491952670.approved.txt
data/manual-annotations/archived-raw-serps/expected/tribunnews-polsek-tallo-1663047668.approved.txt
data/manual-annotations/archived-raw-serps/expected/tribunnews-ricky-natapradja-1663049121.approved.txt
data/manual-annotations/archived-raw-serps/expected/tribunnews-search-term-string-1607106977.approved.txt
data/manual-annotations/archived-raw-serps/expected/tribunnews-search-term-string-1607120098.approved.txt
data/manual-annotations/archived-raw-serps/expected/tribunnews-search-term-string-1607130238.approved.txt
data/manual-annotations/archived-raw-serps/expected/tribunnews-search-term-string-1607224881.approved.txt
data/manual-annotations/archived-raw-serps/expected/tribunnews-search-term-string-1607225592.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitch-a-plague-tale-innocence-1638358324.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitch-central-fluminense-1630540704.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitch-cpentagon-1640060311.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitch-juliversal-1629750531.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitch-rubberboy2001-1661349876.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitch-simplevar-1662753027.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitch-xxlillythefallenangelneko-1638019769.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitter-campaigns-1481768285.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitter-clubs-lang-sr-1591413117.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitter-ecotourism-1557315321.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitter-freemariabutina-1555124003.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitter-freemariabutina-1562498575.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitter-freemariabutina-1563062689.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitter-http-shop-pre-com-corona02-p-409033-1648579256.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitter-lauramajor-1652839406.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitter-rabble-ca-lang-ar-1442999332.approved.txt
data/manual-annotations/archived-raw-serps/expected/twitter-rabble-ca-lang-fr-lang-id-1443046297.approved.txt
data/manual-annotations/archived-raw-serps/expected/vk-000-space-marine-1363614912.approved.txt
data/manual-annotations/archived-raw-serps/expected/vk-grot-1353834377.approved.txt
data/manual-annotations/archived-raw-serps/expected/vk-gta-1389323282.approved.txt
data/manual-annotations/archived-raw-serps/expected/vk-imperatory-illiuzii-1387125239.approved.txt
data/manual-annotations/archived-raw-serps/expected/vk-loco-roco-1377325114.approved.txt
data/manual-annotations/archived-raw-serps/expected/vk-muzyka-1372304839.approved.txt
data/manual-annotations/archived-raw-serps/expected/vk-rabotaiu-na-sebia-1361533546.approved.txt
data/manual-annotations/archived-raw-serps/expected/vk-radioelektronnye-sistemy-1361402773.approved.txt
data/manual-annotations/archived-raw-serps/expected/vk-sportivnye-mototsikly-1387080107.approved.txt
data/manual-annotations/archived-raw-serps/expected/vk-technology-1383988940.approved.txt
data/manual-annotations/archived-raw-serps/expected/weibo-bu-xiang-jiao-hun-li-de-fen-zi-qian-refer-focus-lx-stopic-box-1527256388.approved.txt
data/manual-annotations/archived-raw-serps/expected/weibo-fu-cai-3dshu-ju-jia-wei-xin-xw639-2018-1555261848.approved.txt
data/manual-annotations/archived-raw-serps/expected/weibo-hun-li-li-jie-refer-stopic-box-1505917853.approved.txt
data/manual-annotations/archived-raw-serps/expected/weibo-ji-huo-ma-b-1-page-2-1433297692.approved.txt
data/manual-annotations/archived-raw-serps/expected/weibo-kan-bu-jian-de-yan-pi-1409920649.approved.txt
data/manual-annotations/archived-raw-serps/expected/weibo-li-wei-yi-refer-user-weibo-1517733046.approved.txt
data/manual-annotations/archived-raw-serps/expected/weibo-meng-lin-dexiao-wu-1437753277.approved.txt
data/manual-annotations/archived-raw-serps/expected/weibo-quan-ye-cha-page-13-1517932436.approved.txt
data/manual-annotations/archived-raw-serps/expected/weibo-sheng-fu-lang-xi-si-1603546157.approved.txt
data/manual-annotations/archived-raw-serps/expected/weibo-xiao-xiao-bin-refer-stopic-box-1518290095.approved.txt
data/manual-annotations/archived-raw-serps/expected/wikimedia-ao-xian-yu-le-du-bo-ping-tai-1430758639.approved.txt
data/manual-annotations/archived-raw-serps/expected/wikimedia-figures-in-theatrical-costumes-claude-gillot-1673-1722-class-photo-description-french-painter-drawer-1632572254.approved.txt
data/manual-annotations/archived-raw-serps/expected/wikimedia-group-portrait-on-doorstep-collins-tudor-washington-1898-1970-photographer-75426-object-number-haswb-1629837781.approved.txt
data/manual-annotations/archived-raw-serps/expected/wikimedia-la-dian-zi-ji-1517046182.approved.txt
data/manual-annotations/archived-raw-serps/expected/wikimedia-mou-lin-han-site-pku-edu-cn-1576868395.approved.txt
data/manual-annotations/archived-raw-serps/expected/wikimedia-nito-1655733503.approved.txt
data/manual-annotations/archived-raw-serps/expected/wikimedia-oxygen-1596274448.approved.txt
data/manual-annotations/archived-raw-serps/expected/wikimedia-prob-1543207125.approved.txt
data/manual-annotations/archived-raw-serps/expected/wikimedia-recaptchalogo-svg-1509131182.approved.txt
data/manual-annotations/archived-raw-serps/expected/wikimedia-zao-can-bao-zi-jia-meng-www-baidu-com-aaaa-4ws-2018nian-8yue-4ri-21shi-19fen-39miao-1537939782.approved.txt
data/manual-annotations/archived-raw-serps/expected/xvideos-casey-cavert-go-to-www-lovesbo-ru-1642784433.approved.txt
data/manual-annotations/archived-raw-serps/expected/xvideos-claire-dames-1325320932.approved.txt
data/manual-annotations/archived-raw-serps/expected/xvideos-drunk-1325431509.approved.txt
data/manual-annotations/archived-raw-serps/expected/xvideos-escola-sao-luis-1657929903.approved.txt
data/manual-annotations/archived-raw-serps/expected/xvideos-evander-marius-go-to-www-lovesbo-ru-1642716634.approved.txt
data/manual-annotations/archived-raw-serps/expected/xvideos-free-hardcore-porn-videos-japanese-video-1428541087.approved.txt
data/manual-annotations/archived-raw-serps/expected/xvideos-gay-peeing-porn-go-to-www-lovesbo-ru-1643357466.approved.txt
data/manual-annotations/archived-raw-serps/expected/xvideos-gay-whitezilla-go-to-www-lovesbo-ru-1643416941.approved.txt
data/manual-annotations/archived-raw-serps/expected/xvideos-robber-1248193170.approved.txt
data/manual-annotations/archived-raw-serps/expected/xvideos-solo-1341894522.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-ashland-oregon-1015423512.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-bc-gov-971492707.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-bill-callahan-american-football-1636808341.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-castle-heights-angeles-1611631735.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-civil-code-1658358754.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-dating-sites-1647656764.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-diver-lg-u8180-1620023310.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-dunwells-army-of-friends-1617218301.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-envious-that-biden-1652739375.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-every-previewsworld-calls-1649106369.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-free-mail-centers-970285370.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-free-nude-pics-of-brittney-spears-970473571.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-free-pics-bbbw-1041625676.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-free-xxx-asian-pics-952102259.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-freeware-936293306.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-fresh-prince-of-bel-air-971413040.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-frugal-994624570.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-fruitarianism-970289154.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-full-speed-1011203807.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-funny-970842855.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-funny-pictures-943791338.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-futurama-1314932107.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-future-of-sport-971016077.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-gabel-970409689.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-gaelic-970435492.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-gamefaq-970449707.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-games-970945905.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-games-puzzles-brain-teasers-sudoku-1574052323.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-games-video-games-developers-and-publishers-croteam-1624838167.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-gamespot-portugal-1036145291.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-gaming-club-997142327.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-ganze-filme-online-schauen-kostenlos-und-in-voller-lange-1376615487.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-gay-shower-sex-961542771.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-gender-discrimination-970694307.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-general-s-daughter-the-970749419.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-genserv-971364933.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-george-foreman-boxer-1040476713.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-georgetown-university-law-center-970779220.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-georgia-restaurant-association-970314665.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-german-pen-pals-961119166.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-ghar-1005251824.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-ghulam-sarwar-khan-1626337646.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-gina-mckee-998889511.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-girlsandanimals-1039016411.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-glass-tools-961515348.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-global-and-parts-970542388.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-goddess-955975798.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-gogi-grant-1041483222.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-golden-books-971368161.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-golf-poll-971193897.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-golson-1017320115.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-gordon-bruce-955082521.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-govote-com-955100292.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-hombres-con-pelo-en-el-pecho-photos-1359853955.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-isnt-even-weirdest-thing-america-right-1653343893.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-jello-gelatin-971145484.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-john-mccain-956454509.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-lawyer-career-information-970996615.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-learn-to-focus-1619373855.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-lm-1376048795.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-mark-schlissel-wife-1642367070.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-metallurgi-1042532635.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-molly-shannon-1640079691.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-region-de-coquimbo-970960857.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-sam-bush-1016625678.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-telekwiaciarnia-pl-1436841282.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-trans-texas-corridor-1613259804.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-wheatstone-bridge-1613009822.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-world-greek-kata-periokhe-boreia-amerike-kanadas-1647085990.approved.txt
data/manual-annotations/archived-raw-serps/expected/yahoo-world-hebrew-hbrh-shlvm-1489427128.approved.txt
data/manual-annotations/archived-raw-serps/expected/yandex-danses-tv-periodic-1534841786.approved.txt
data/manual-annotations/archived-raw-serps/expected/yandex-niusha-1515577404.approved.txt
data/manual-annotations/archived-raw-serps/expected/yandex-speed-force-1535895408.approved.txt
data/manual-annotations/archived-raw-serps/expected/yandex-speed-force-1535955246.approved.txt
data/manual-annotations/archived-raw-serps/expected/yandex-speed-force-1535970436.approved.txt
data/manual-annotations/archived-raw-serps/expected/yandex-speed-force-1535973684.approved.txt
data/manual-annotations/archived-raw-serps/expected/yandex-speed-force-1536042339.approved.txt
data/manual-annotations/archived-raw-serps/expected/yandex-speed-force-1536100368.approved.txt
data/manual-annotations/archived-raw-serps/expected/yandex-spirited-away-animated-film-2001-1524478207.approved.txt
data/manual-annotations/archived-raw-serps/expected/yandex-virat-swaroop-1523992633.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-ampatuanmassacre-1583309425.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-cardistry-asmr-1577113546.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-chaoz-time-1652155691.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-chto-budet-esli-sobrat-vse-rezinki-v-bully-1599555287.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-hp-probook-640-g1-razborka-1579996098.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-kak-sdelat-vzryv-v-cinema-4d-1578732009.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-kak-vybit-dushu-moba-1599057231.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-kutyaplya-1561171748.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-lataji-1563086980.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-literatura-6-klass-biografiia-pushkina-1595705363.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-ne-prosto-bekkhen-reaktsiia-1582514079.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-pora-tiulpanov-aktery-1574991226.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-prokhozhdenie-igry-madagaskar-2-chast-4-1562167916.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-pudding-1563068696.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-q2-2017-arizona-west-regional-1547871680.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-razbor-shchetki-pylesosa-samsung-1584184489.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-robloks-mip-siti-2019-1583715307.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-shang-yue-xian-ru-pu-1582390054.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-shang-yue-xian-rupu-1582390054.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-uzbekskaia-svadba-v-shymkente-1574145605.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-vasilii-emelianenko-tefteli-1578285143.approved.txt
data/manual-annotations/archived-raw-serps/expected/youtube-zadnii-most-moskvich-412-ustroistvo-1584150216.approved.txt
data/manual-annotations/archived-raw-serps/warcs/360-21tian-jian-fei-fa-1653652529.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-an-jian-diao-cha-bi-lu-1576497545.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-chen-teng-tan-han-han-mei-ren-jie-ji-1577810108.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-duo-jia-ju-chang-qu-xiao-yan-chu-1579663841.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-hui-ji-pei-xun-1579668897.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-jin-ji-che-hui-1576637402.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-ju-min-jia-zhong-fei-jin-bian-fu-1585788499.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-lu-xing-she-tuan-dui-you-zan-ting-1580014331.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-mao-bu-yi-xiao-chou-chao-xi-1576791478.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-mei-guo-qian-zheng-1579954288.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-niu-jie-5hao-1576819311.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-shi-jie-zui-ai-de-ren-qu-shi-1579483438.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-si-chuan-fa-sheng-6-8ji-di-zhen-1662384982.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-site-chaxun-biz-1550145271.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-site-chaxun-biz-1550161171.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-site-chaxun-biz-1551742698.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-site-eng-kaz-enacademic-com-1581787441.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-tao-bao-ru-he-che-hui-ping-jie-1576604187.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-wu-xiu-bo-yang-kun-ju-hui-hai-ge-1577858222.warc.gz
data/manual-annotations/archived-raw-serps/warcs/360-zhang-bo-zhi-bei-gou-yao-shang-1661090641.warc.gz
data/manual-annotations/archived-raw-serps/warcs/aliexpress-barefoot-accessories-1508385234.warc.gz
data/manual-annotations/archived-raw-serps/warcs/aliexpress-children-school-bag-1388612710.warc.gz
data/manual-annotations/archived-raw-serps/warcs/aliexpress-jewelry-sets-1390214039.warc.gz
data/manual-annotations/archived-raw-serps/warcs/aliexpress-kids-wear-1293514157.warc.gz
data/manual-annotations/archived-raw-serps/warcs/aliexpress-q5-phone-1374387535.warc.gz
data/manual-annotations/archived-raw-serps/warcs/aliexpress-sterling-silver-gemstone-1384701071.warc.gz
data/manual-annotations/archived-raw-serps/warcs/aliexpress-sterling-silver-pandora-charms-1457090417.warc.gz
data/manual-annotations/archived-raw-serps/warcs/aliexpress-transmission-shaft-1435605057.warc.gz
data/manual-annotations/archived-raw-serps/warcs/aliexpress-waterproof-winter-boots-women-1500418630.warc.gz
data/manual-annotations/archived-raw-serps/warcs/aliexpress-women-messenger-bags-1397198302.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-deng-shi-jia-meng-www-baidu-com-aaaa-oq1-2018nian-8yue-19ri-19shi-32fen-18miao-1564357198.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-dnd-flash-mosquito-1633240377.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-eksa-1662208504.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-gaming-monitor-1639065822.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-guang-huaiba-pawameta-1632443655.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-gym-mat-tile-1634791656.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-joseph-menn-1605789427.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-lovense-1618431049.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-monitor-1625069899.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-notebook-dell-1613232661.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-omega-labyrinth-z-1616510370.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-pillow-fsa-1615964514.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-qian-lian-mo-hua-orizinarusaundotoratsuku-1657685343.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-solefit-1663015835.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-tazas-te-transparente-1613035337.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-the-montells-you-can-t-make-me-1617199271.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-the-risks-of-prescription-drugs-1657820625.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-under-armour-socks-1553107494.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-yangumagazin-yanmagasado-1625727694.warc.gz
data/manual-annotations/archived-raw-serps/warcs/amazon-zao-dian-jia-meng-pin-pai-www-baidu-com-aaaa-zv9-2018nian-8yue-21ri-17shi-49fen-4miao-1564430721.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-afraid-of-women-1172618037.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-apologist-1172369538.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-are-alkali-metals-lighter-than-water-1619387309.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-batman-movie-1467834503.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-big-tex-trailer-for-sale-1649774735.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-boxer-ear-crop-1173516809.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-caring-1173637789.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-cell-biology-1173639673.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-cure-for-boredom-1174210645.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-date-guy-fawkes-death-1173527460.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-diaframma-contraccezione-lang-it-1175070504.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-dog-ear-design-1172708874.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-fachkunde-metall-fur-ausbildung-in-maschinenbauberufen-1461053109.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-facula-site-www-wordreference-com-1173391757.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-failures-of-president-lincoln-1611567628.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-faither-site-www-accringtonweb-com-1173391901.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-five-phases-of-mitosis-1173539024.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-free-grammer-test-for-employment-1443411312.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-genus-falco-1172718376.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-http-my-notes-on-blogspot-com-1401243816.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-i-ve-site-news-bbc-co-uk-1172693923.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-if-you-break-a-fluorescent-light-bulb-1618021531.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-interior-design-classes-online-1651218822.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-japanese-airlines-1173622069.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-lopsided-site-www-usatoday-com-1173623642.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-meaning-of-integral-site-www-elook-org-1174247342.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-means-mutable-site-www-geek-interview-comrview-com-1173713625.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-means-mutable-site-www-geekinterview-com-1173392177.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-names-of-reggae-artists-1173527903.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-old-fashioned-labels-1172720557.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-olympic-rings-1172716332.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-perfect-first-date-1180217842.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-peter-krogh-photographer-1184320758.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-preparation-of-offal-1172710460.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-radioactivity-in-medicine-1173728275.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-rhino-records-1173555865.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-saiy-phiohom-1525375661.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-scorch-removal-1172719147.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-smirnoff-label-1173377085.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-tie-dye-patterns-1446417858.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-tye-dye-instructions-1446417925.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-vitamins-good-after-expiration-date-expires-site-www-cfs-purdue-edu-1173531858.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-weather-report-for-22903-1489829020.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-week-names-1173639143.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-what-s-california-s-state-bird-1175130217.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-what-should-i-wear-on-the-first-day-of-school-1442349823.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-what-words-rhyme-with-afraid-1173540494.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-whelped-definition-1173526805.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-who-framed-roger-rabbit-1473167643.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ask-www-ksu-edu-sa-1182367717.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-e-eeeae-1522165852.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-e-eeeae-1544443888.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-e-eeeae-1547510808.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-e-eeeae-1554431691.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-e-eeeae-1558963051.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-e-eeeae-1567878230.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-e-eeeae-1569971117.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-eru-1525597474.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-lian-xi-qu-dian-nao-pei-xun-1643390077.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-lian-yun-gang-qi-yang-yue-zi-hui-suo-zhong-xin-jing-zhun-ke-hu-ying-xiao-key668-cn-1537259978.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-long-feng-qu-qi-quan-qi-huo-pei-xun-1642853767.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-long-shi-liang-1639014949.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-mao-kui-lu-mao-cong-cong-mao-ning-kui-mao-dan-dan-mang-lu-1549835769.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-mao-kui-lu-mao-cong-cong-mao-ning-kui-mao-dan-dan-mang-lu-1553838201.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-mao-kui-lu-mao-cong-cong-mao-ning-kui-mao-dan-dan-mang-lu-1558979495.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-mao-kui-lu-mao-cong-cong-mao-ning-kui-mao-dan-dan-mang-lu-1564025418.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-mao-ning-kui-mao-dan-dan-mang-long-lou-mang-lu-shikato-1537858258.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-sexinsex-1-2-1213858525.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-shang-hai-11xuan-5ding-dan-wei-xin-weiwei776699-1545685930.warc.gz
data/manual-annotations/archived-raw-serps/warcs/baidu-zhong-guo-lian-tong-smsc-1372160086.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-100-9-classic-country-radio-station-alaska-1660338459.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-1137ce-1639788231.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-1968-cougar-on-craigslist-1480218715.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-agent-077-mission-bloody-mary-movie-1593376539.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-aldershot-news-1629564105.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-allovercr-1423275634.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-arab-suck-and-fuck-bouchra-1365405319.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-blockbench-github-1652298697.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-christian-r-ntizimira-1607730426.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-classement-de-la-premier-league-1658725630.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-clay-andrews-1649253287.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-clobetasol-without-prescription-1615178898.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-cody-machan-facebook-1594008363.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-common-use-facilities-1643636012.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-computers-software-presentation-1488623366.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-connecticut-covid-deaths-1628019384.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-corner-app-1618998889.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-countercyclical-fiscal-policy-1643622693.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-crimson-coward-1640789839.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-customer-service-phone-number-for-hp-printer-1662986585.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-dan-robitzski-1660531082.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-dash-investment-foundation-1644415217.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-dataquantum-com-vancouver-hosting-1375879464.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-eero-pro-mesh-wifi-system-1659437763.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-elon-musk-tesla-stock-drop-1656685094.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-european-cannibalism-1591185526.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-explore-with-us-youtube-emma-1651605205.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-florence-caillon-bandcamp-1647897680.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-great-blue-heron-sound-1660552923.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-harukazewakaba0-1643181401.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-herzlich-willkommen-unterbindet-den-storeinfluss-bei-psychosen-1650332555.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-intel-i7-chip-1656625238.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-kumolife-1388896361.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-kutuklui-affair-1643643819.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-lake-wappapello-state-wildlife-area-1643615402.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-libyan-syrian-union-1643642965.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-limbpower-1640025328.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-limited-range-icbm-1643649846.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-mehmet-oz-florida-hunting-license-1657728564.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-mesozoic-wikipedia-1643229373.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-mighty-music-1578065758.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-nexus-mods-manager-1662582175.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-obama-speech-1274497739.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-regional-asia-taiwan-localities-taichung-city-1580952978.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-rpg-title-screen-1656104004.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-shang-chi-film-1563662560.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-sungard-1555022695.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-sweden-riots-1618569435.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-team-liquid-teams-1652030641.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-the-clavarioid-fungi-of-new-zealand-ron-petersen-1556393373.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-uscis-forms-400-1486690408.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-vintage-pittsburgh-steelers-steel-curtain-1497160668.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-wikipedia-orb-univers-de-fiction-1643880033.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-wikipedia-port-de-gennevilliers-metro-de-paris-1604443017.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-wikipedia-privatbrauerei-hoepfner-1620534005.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-wikipedia-rock-macabre-1603539954.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-wikipedia-sider-tribu-1593501017.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-wikipedia-vesuvius-1641311740.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-win10-iso-xia-zai-1580349240.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bing-wonder-kids-beginning-1652132287.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bongacams-asslicking-1623701105.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bongacams-camshow-1653633300.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bongacams-cock-sucking-1617355851.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bongacams-facial-1578106424.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bongacams-fucking-1577494848.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bongacams-hd-plus-1576443879.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bongacams-massage-1604010948.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bongacams-stripping-1623091287.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bongacams-stripping-1648087966.warc.gz
data/manual-annotations/archived-raw-serps/warcs/bongacams-teasing-1635992326.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-67-degrees-c-static-atmosphere-1665006071.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-a2z-chip-1632000373.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-advanced-search-query-1667410105.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-amoled-1646168352.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-ape-1648509867.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-apple-t3-chip-1651405075.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-avnon-dan-1998-martin-buber-the-hidden-dialogue-lanham-boulder-new-york-oxford-rowman-littlefield-1649576842.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-best-notetaking-app-1654643212.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-bivoks-trebehandling-1654325149.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-chomikuj-1656776694.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-copyq-1665902945.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-cubecraft-skyblock-pig-farm-1664124008.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-dark-brown-mushrooms-that-melt-in-to-the-ground-1657827723.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-fastest-otto-guide-1649849902.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-froggy-pool-1651139840.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-google-play-store-1649985658.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-greentext-1664484724.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-h-m-home-1664916031.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-house-building-cost-estimate-1664320455.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-how-to-archive-mac-notes-1658260525.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-how-tot-ell-if-tail-recurssive-1658814198.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-import-esbuild-from-esbuild-syntaxerror-unexpected-identifier-1652662700.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-indiana-vaccine-passport-ban-1629877535.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-jinniebella-1666397597.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-kymatica-1652976922.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-logitech-1661137612.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-maintenance-1661082520.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-masi-uno-riser-chain-cover-1658006343.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-metaverse-1650224042.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-nair-1666404375.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-new-fold-4-1657628120.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-new-mac-os-release-1664483322.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-nvfbc-1651575025.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-openoffice-1667290210.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-pekara-fontana-niksic-1649235416.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-pizza-box-1662098145.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-product-life-cycle-definition-1664819445.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-random-number-python-1649475875.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-rent-1647905724.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-safemoon-1653585598.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-spigot-1660718390.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-terraform-github-container-1666470147.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-testimonies-project-1653158644.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-tina-daunt-1652776164.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-troll-1649987736.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-unremovable-1650484694.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-usb-3-1-type-c-dp-alt-mode-1667002333.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-utilitx-1659649168.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-video-1649793956.warc.gz
data/manual-annotations/archived-raw-serps/warcs/brave-virtualbox-extensions-1667278528.warc.gz
data/manual-annotations/archived-raw-serps/warcs/canva-instagram-reels-video-1607594697.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-35-backen-1351851992.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-eier-milch-kse-kartoffeln-1318228714.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-eier-parmesan-spinat-sahne-1206623203.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-eier-spinat-pilze-1200619371.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-eierflaumsuppe-1249321209.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-eierlikr-gugelhupf-1203899612.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-eierlikr-kirschkuchen-1243942587.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-eierlikr-mit-kirsch-1375310772.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-eierlikr-nachspeise-1255758312.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-eierschwammerl-rahmsauce-1449833431.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-eierschwammerl-und-gehacktes-1315110709.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-eifreier-hackbraten-1356156512.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-hhnchen-warme-1303285108.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-kirsch-1305195838.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-kohlroulade-gemse-1328779105.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-kseschnitzel-kse-1353053392.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-nudelsalat-mit-ei-1330099391.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-omas-blechkuchen-1355822404.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-roulade-braten-1355445937.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-sahne-und-himbeeren-1192658021.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-spaghetti-eis-torte-1342866905.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-spaghetti-hhnchen-1192740442.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-spaghetti-mit-gemsesauce-1190132272.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-spaghettie-mit-garnelen-1206750318.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-spaghettitorte-vom-blech-1369060560.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-spaghettoni-1206569039.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-spanische-salat-1192556276.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-spargel-geschlt-1278411144.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-spargel-m-soe-1280861753.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-spargel-risotto-mit-garnelen-1471699836.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-spargel-wei-1194284442.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-speck-n-dicken-1370169101.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-speck-zucchini-eier-sahne-1222747904.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-speckbohnen-mit-kartoffeln-1352170361.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-speisestrke-sahne-1232351646.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-spinat-in-1220295440.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-streuselkuchen-aus-mrbeteig-1299585024.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-suppen-oder-eintpfe-1256106491.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-sushi-mit-normalem-reis-1470947014.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-syrische-pasta-1466000049.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-tabouleh-rosinen-1382360347.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-tatar-steak-1266004316.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-tempura-1213419780.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-thai-curry-1246123954.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-thai-curry-einfach-1420408232.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-thailndisch-1313401080.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-thermomix-gefllten-1390802313.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-tomaten-mozarella-reis-1317162887.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-tupperware-hefe-1356254719.warc.gz
data/manual-annotations/archived-raw-serps/warcs/chefkoch-walnussl-dressing-1403236002.warc.gz
data/manual-annotations/archived-raw-serps/warcs/cnn-achievable-possibility-1642416655.warc.gz
data/manual-annotations/archived-raw-serps/warcs/cnn-apple-watch-2016-1662575890.warc.gz
data/manual-annotations/archived-raw-serps/warcs/cnn-biteukoinsaryeomyeon-www-99m-kr-bei-biteukoinsaryelie-biteukoinsaeobbbiteukoinsaeobjadeungrog-biteukoinsayongbangbeob8reduplicate-1647153716.warc.gz
data/manual-annotations/archived-raw-serps/warcs/cnn-dxa-1634498874.warc.gz
data/manual-annotations/archived-raw-serps/warcs/cnn-kindly-check-1642508434.warc.gz
data/manual-annotations/archived-raw-serps/warcs/cnn-march-4-1633908556.warc.gz
data/manual-annotations/archived-raw-serps/warcs/cnn-north-dakota-coronavirus-1632793271.warc.gz
data/manual-annotations/archived-raw-serps/warcs/cnn-skilled-1643388398.warc.gz
data/manual-annotations/archived-raw-serps/warcs/cnn-trigger-1638271567.warc.gz
data/manual-annotations/archived-raw-serps/warcs/cnn-wright-1616229078.warc.gz
data/manual-annotations/archived-raw-serps/warcs/csdn-android-studio-1660487187.warc.gz
data/manual-annotations/archived-raw-serps/warcs/csdn-fifo-1663204137.warc.gz
data/manual-annotations/archived-raw-serps/warcs/csdn-rows-1665572662.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-145-lbs-to-kg-1664351690.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-150-degrees-to-radians-site-degreestoradians-net-1662073498.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-2-5-muiles-to-km-1648676868.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-2022-07-12-23-00-site-www-time-time-net-1657640396.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-25-c-to-f-site-www-metric-conversions-org-1655636638.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-32168-weather-radar-1667504070.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-3rd-party-twitch-chat-1642095474.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-40-mile-creek-trail-site-www-arizonahighways-com-1657173375.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-branch-conventions-git-site-social-msdn-microsoft-com-1664392383.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-breaking-news-on-sierra-leone-1663541702.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-broken-reality-steam-site-www-huntmar-com-1597289631.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-buck-showalter-seinfeld-1654420295.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-build-chest-freezer-site-www-quora-com-1654893310.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-bulk-copper-pennies-for-sale-1646606334.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-burnout-paradise-online-multiplayer-with-all-dlc-site-www-counton-org-1655566858.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-c-pretty-print-json-1662310061.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-elite-dangerous-covas-site-www-pcgamer-com-1653704722.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-elite-dangerous-site-www-thegamer-com-1658908937.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-elton-john-site-www-esquire-com-1657307467.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-emoji-pedia-site-www-youtube-com-1590838578.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-empure-site-empure-in-1664600213.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-encountered-conflicts-when-cherry-picking-commit-1618189582.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-enneagram-test-site-www-crystalknows-com-1638683347.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-equation-of-dissociation-of-sulfuric-acid-site-www-sciencedirect-com-1649296927.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-erik-erikson-s-theory-site-positivepsychology-com-1654620203.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-gimp-use-align-tool-site-thegimptutorials-com-1653712700.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-jeanne-d-arc-site-id-wikipedia-org-1655183773.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-llanelly-carmarthenshire-wales-1655261859.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-newest-call-of-duty-game-1653477001.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-quit-telnet-site-www-codegrepper-com-1665105234.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-sheer-skirt-beach-thing-site-www-lyst-com-1653921398.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-sheets-site-www-kohls-com-1642928572.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-sheydim-site-www-sefaria-org-1664233097.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-simplify-subtraction-of-fractals-site-www-thecalculator-co-1637459222.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-sims-castaway-trailer-1647012563.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-u-team-1636548723.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-ubuntu-mesa-intel-r-hd-graphics-620-kbl-gt2-site-forum-unity-com-1658976095.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-ubuntu-netplan-package-site-www-ubuntuupdates-org-1665115336.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-ukraine-site-www-cfr-org-1646796603.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-united-reformed-churches-in-north-america-1446324275.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-universal-logs-checker-1-1-0-site-cracking-org-1656559962.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-update-admx-files-on-domain-controller-1660061931.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-waldo-s-chicken-site-waldoschicken-com-1654372116.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-warren-hunt-1635806147.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-waterford-house-erfstadt-court-wokingham-berkshire-rg40-2yf-google-maps-1660892879.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-we-acknowledge-the-traditional-custodians-of-the-land-on-which-our-office-stands-the-wurundjeri-peop-1654920640.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-webassembly-browser-support-list-1653198525.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-website-sitemap-finder-site-seositecheckup-com-1614287233.warc.gz
data/manual-annotations/archived-raw-serps/warcs/duckduckgo-what-happened-to-greta-thornburg-1667535932.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ebay-1-4-1566151598.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ebay-hu-bei-kuai-san-zhong-jiang-zhu-shou-jia-wei-vxin-weiwei776699-1548361753.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ebay-imaginext-batman-motorcycle-1597143554.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ebay-liu-he-cai-2o2526-wei-xin-weiwei776699-1562672411.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ebay-liu-he-cai-gua-pai-wan-zheng-ban-wei-vxin-weiwei776699-1565563054.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ebay-se-xing-mei-jia-wei-vxin-dun35358-1544323503.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ebay-shan-dong-11xuan-5-360cai-piao-wei-xin-weiwei776699-1538125942.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ebay-smartphones-1334931269.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ebay-srch-str-1641320481.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ebay-victoria-s-secret-1559541146.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-8-ft-to-cm-1629639998.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-average-amount-of-photos-you-could-take-on-a-camera-in-1940-s-1572660962.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-barnes-1636235793.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-by-talos-this-cant-be-happening-1630519906.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-can-you-show-smoking-on-tv-1624555764.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-coding-freelancing-1634534706.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-correct-way-to-wash-hair-oily-scalp-1588676008.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-dall-e-1654952788.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-deaf-community-1626760345.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-financial-risk-tolerance-quiz-1643759873.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-foot-to-centimeter-1612629786.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-form-1694-instructions-1635977208.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-free-file-sharing-services-1638926359.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-fudanshi-1655238275.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-game-changer-classic-1638948940.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-git-create-pull-request-1655702772.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-gmail-sign-in-1637276050.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-gnome-desktop-entry-1655209403.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-google-image-scraper-1601781718.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-grady-white-ce-251-1636884788.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-h-and-m-clothing-sale-1635863133.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-hallam-f-c-1596174558.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-harry-styles-siblings-1634695267.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-health-conditions-and-diseases-neurological-disorders-meningitis-1666663445.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-high-functioning-depression-23w-1615448305.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-hisotry-of-tomato-in-india-23yt-1591696836.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-hm-219c-1637494750.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-how-much-doordash-driver-make-1654857157.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-how-to-be-more-generous-1590871266.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-how-to-check-if-a-value-is-null-in-c-1639813391.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-laughter-stories-1640836502.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-macglauglin-1640487447.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-percy-jackson-s-greek-gods-1634509308.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-saltpeter-beds-1643653808.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-sin-is-an-ugly-creature-1590737798.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-vasectomy-reversal-success-rate-23yt-1623229800.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-virtual-studio-code-download-for-windows-10-1642714491.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-watch-tv-series-23g-1602851877.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-we-will-rock-you-23yt-1587407460.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-west-point-nebraska-1644663254.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-what-does-god-do-to-tratorirs-1590883066.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-what-is-a-description-1655190914.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-what-s-the-shortest-war-ever-1635275630.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-where-are-my-chrome-extensions-1635276242.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-whiteman-afb-public-affairs-1636203076.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-why-can-t-you-order-international-nail-polish-online-india-23a-1586448930.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-windows-11-activator-reddit-1637172885.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-windows-for-workgroups-3-11-iso-1644191359.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-world-deutsch-regional-europa-deutschland-baden-wurttemberg-stadte-und-gemeinden-karlsruhe-1621530240.warc.gz
data/manual-annotations/archived-raw-serps/warcs/ecosia-world-deutsch-regional-europa-deutschland-hessen-landkreise-rheingau-taunus-kreis-stadte-und-gemeind-1595135090.warc.gz
data/manual-annotations/archived-raw-serps/warcs/espn-ball-state-1615730301.warc.gz
data/manual-annotations/archived-raw-serps/warcs/espn-ball-state-1619440827.warc.gz
data/manual-annotations/archived-raw-serps/warcs/etsy-andrew-kim-1566153959.warc.gz
data/manual-annotations/archived-raw-serps/warcs/etsy-embroidery-kit-1375805089.warc.gz
data/manual-annotations/archived-raw-serps/warcs/etsy-hard-plastic-1333819223.warc.gz
data/manual-annotations/archived-raw-serps/warcs/etsy-invitation-1367234841.warc.gz
data/manual-annotations/archived-raw-serps/warcs/etsy-pacifier-1336437253.warc.gz
data/manual-annotations/archived-raw-serps/warcs/etsy-pendants-1667648711.warc.gz
data/manual-annotations/archived-raw-serps/warcs/etsy-small-animal-1378528595.warc.gz
data/manual-annotations/archived-raw-serps/warcs/etsy-storage-and-organization-1632881953.warc.gz
data/manual-annotations/archived-raw-serps/warcs/etsy-sundress-1374472455.warc.gz
data/manual-annotations/archived-raw-serps/warcs/etsy-yan-dong-kuai-le-shi-fen-shou-ji-ban-jia-wei-xin-xw639-2018-1537911471.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-alda-lesbiennes-refugiees-1615284371.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-bernieorbust-1467812085.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-blog-post-319-je31-1567459151.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-blog-post-334-bootload-1567494170.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-cruzcrew-1459272010.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-deanna-sanchez-1629215596.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-greet-1623235952.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-https-peelarchivesblog-com-about-peel-1599241783.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-ineligible-1466870871.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-mens-health-survival-of-the-fittest-1619473718.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-mr-robot-1469187052.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-rosy-20gupta-1494524363.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-social-plugins-boutons-jaime-envoyer-partager-et-citations-js-exec-je31-1567485463.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-solcellespecialisten-1389488036.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-tag-someone-who-needs-this-1587554575.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-trumptrain-1461904486.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-vanilla-1481832838.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-virpi-soikkeli-1623257178.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-wisconsin-1463064570.warc.gz
data/manual-annotations/archived-raw-serps/warcs/facebook-www-9xcb-biz-webex-setup-was-unsuccessful-error-23-1404412853.warc.gz
data/manual-annotations/archived-raw-serps/warcs/github-jie-shi-de-jing-mi-gong-ye-you-xian-gong-si-1597737683.warc.gz
data/manual-annotations/archived-raw-serps/warcs/github-licensing-gethhwid-1662581846.warc.gz
data/manual-annotations/archived-raw-serps/warcs/github-mastodon-1657854340.warc.gz
data/manual-annotations/archived-raw-serps/warcs/github-org-zettlr-1591675518.warc.gz
data/manual-annotations/archived-raw-serps/warcs/github-subrock-1653099784.warc.gz
data/manual-annotations/archived-raw-serps/warcs/github-topic-bootswatch-org-sslcom-1552777180.warc.gz
data/manual-annotations/archived-raw-serps/warcs/github-topic-deprecated-org-bandwidth-fork-true-1634361552.warc.gz
data/manual-annotations/archived-raw-serps/warcs/github-topic-docker-stack-org-issuu-1549097482.warc.gz
data/manual-annotations/archived-raw-serps/warcs/github-topic-id-org-codercom-1553274306.warc.gz
data/manual-annotations/archived-raw-serps/warcs/github-topic-web-components-org-github-fork-true-1650012538.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-243-1628713922.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-a-tumeo-m-branca-l-camerini-a-dual-priority-realtime-multiprocessor-system-on-fpga-for-automotive-ap-1614181186.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-atalanta-bergamasca-calcio-wikipedia-1643703998.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-attack-on-titan-season-3-part-2-1556408967.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-bill-easley-sophisticated-prelude-1626498182.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-boulevard-records-canada-site-wikipedia-org-site-wikimedia-org-1510135498.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-bouncing-hero-switch-site-easyallies-com-1633303267.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-bozsa-bence-site-hu-wikipedia-org-1647787452.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-can-ju-ying-yu-1560296360.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-chi-zhen-nzhong-rong-keteru-1608917828.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-compress-tube-wikipedia-1644670761.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-coneybury-anomaly-wikipedia-1640176109.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-conflict-middle-east-wikipedia-1636797028.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-continental-automotive-systems-wikipedia-1651015350.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-crow-names-1608438374.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-diffusion-systems-for-evaluation-of-biomineralization-1618448715.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-does-steve-has-a-beard-1601705030.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-evan-colborne-1647984326.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-facebuster-1650197554.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-fatmira-brecani-1662136538.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-fer-palacio-1631069534.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-film-review-annual-1660769248.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-finance-1540158323.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-flop-thumbs-up-1568839345.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-focusrite-1641240556.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-forced-labor-in-california-1635373615.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-front-polisario-khat-al-shahid-1652852892.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-future-planning-1648480487.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-george-w-summers-1637786317.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-giulia-botti-1660836463.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-gnosticism-1615175612.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-grasshopper-design-pvt-ltd-1640249780.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-green-capital-energy-site-wikipedia-org-site-wikimedia-org-1657756151.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-green-wave-106-5-fm-1637281540.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-guntury-1650179158.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-hawaii-part-ii-lyrics-1633318830.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-hola-games-1552338270.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-kolex-1645947964.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-kostiantyn-magaletskyi-1638351261.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-kothuru-assembly-constituency-1631384737.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-kurabayashi-1643815267.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-kush-raval-indian-cricketer-site-wikipedia-org-site-wikimedia-org-1649726560.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-la-pipa-1635023533.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-lars-brygmann-1633135602.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-laxmikant-pyarelal-1657295550.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-leo-de-la-strehaia-1633884656.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-lige-gardner-1637042221.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-list-of-cantons-of-france-1634951028.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-list-of-crossings-of-the-james-river-1662064377.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-list-of-grand-dukes-of-russia-1645733808.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-list-of-surviving-lockheed-f-104-starfighters-1662745731.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-lope-recio-loynaz-1658853508.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-lucas-ruzin-1658326494.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-lucius-vibullius-rufus-son-in-law-of-herodes-atticus-1642439444.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-luiz-carlos-footballer-born-1980-wikipedia-1637131910.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-lycee-francais-louis-pasteur-de-lagos-1638831028.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-modern-times-chaplin-watch-online-1662343522.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-muhammed-rashid-1656890873.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-now-it-s-time-for-your-treatment-relax-make-yourself-comfortable-1427746605.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-ocolc-826746-1240020639.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-orlando-bedoya-site-wikipedia-org-site-wikimedia-org-1629326434.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-pareques-site-hu-wikipedia-org-1647941362.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-sarah-monfort-wikipedia-1647374906.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-susan-boyle-make-me-a-channel-of-your-peace-1607791072.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-taikoo-hui-mandarin-oriental-hotel-guangzhou-1652086766.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-w-fan-j-li-s-ma-n-tang-and-w-yu-april-2012-towards-certain-fixes-with-editing-rules-and-master-data-the-vldb-journal-21-2-213-238-297-10-1007-s00778-011-0253-7-1614165399.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-wan-y-menon-s-and-ramaprasad-a-2009-the-paradoxical-nature-of-electronic-decision-aids-on-comparison-1614187144.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-why-is-one-foot-slightly-larger-than-the-other-one-1605140430.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-win10-iso-xia-zai-1577717811.warc.gz
data/manual-annotations/archived-raw-serps/warcs/google-zombie-apocalypse-1565114134.warc.gz
data/manual-annotations/archived-raw-serps/warcs/imdb-0609265-s-nm-1329020836.warc.gz
data/manual-annotations/archived-raw-serps/warcs/imdb-angelina-jolie-1452700725.warc.gz
data/manual-annotations/archived-raw-serps/warcs/imdb-dogville-1187303706.warc.gz
data/manual-annotations/archived-raw-serps/warcs/imdb-gundula-rapsch-1628094679.warc.gz
data/manual-annotations/archived-raw-serps/warcs/imdb-hunger-games-1518585690.warc.gz
data/manual-annotations/archived-raw-serps/warcs/imdb-marcela-gomez-montoya-1614546944.warc.gz
data/manual-annotations/archived-raw-serps/warcs/imdb-murder-world-1268209692.warc.gz
data/manual-annotations/archived-raw-serps/warcs/imdb-pulse-1283006912.warc.gz
data/manual-annotations/archived-raw-serps/warcs/imdb-sam-claflin-1472223834.warc.gz
data/manual-annotations/archived-raw-serps/warcs/imdb-the-expanse-1521743964.warc.gz
data/manual-annotations/archived-raw-serps/warcs/imgur-search-term-string-1547858079.warc.gz
data/manual-annotations/archived-raw-serps/warcs/imgur-search-term-string-1565643838.warc.gz
data/manual-annotations/archived-raw-serps/warcs/indeed-60000-1450529560.warc.gz
data/manual-annotations/archived-raw-serps/warcs/indeed-concept-development-integration-1647187061.warc.gz
data/manual-annotations/archived-raw-serps/warcs/indeed-customer-service-1447983624.warc.gz
data/manual-annotations/archived-raw-serps/warcs/indeed-hca-corporate-1334425152.warc.gz
data/manual-annotations/archived-raw-serps/warcs/indeed-higher-education-freelance-network-1585036169.warc.gz
data/manual-annotations/archived-raw-serps/warcs/indeed-international-english-prep-academy-iepa-1586237411.warc.gz
data/manual-annotations/archived-raw-serps/warcs/indeed-jvm-lending-1586272513.warc.gz
data/manual-annotations/archived-raw-serps/warcs/indeed-origins-macy-s-1353165507.warc.gz
data/manual-annotations/archived-raw-serps/warcs/indeed-pepsico-1487893385.warc.gz
data/manual-annotations/archived-raw-serps/warcs/indeed-steiner-business-solutions-1577184429.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-1368578723.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-ch-1382528052.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-che-zai-cd-1507664971.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-dao-tian-1442736754.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-guan-yin-liao-1501752634.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-iu-vdun35358z-1537907650.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-ji-guang-da-yin-1516054404.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-mo-yan-1516163665.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-qing-shang-1510505248.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-sha-tan-ku-nan-1446537277.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-shlrwanh-uq-2179706936-1473350033.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-song-yan-1434320372.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-tai-kong-zhen-1508948206.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-tuan-dui-guan-li-1429813603.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-weiwei776699e-1537978473.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-xian-xing-dai-shu-1497236213.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-yang-hong-wei-1429640037.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-you-xi-1511265243.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-yu-diao-jiu-ning-meng-1601078153.warc.gz
data/manual-annotations/archived-raw-serps/warcs/jd-yxingaiujliu-xwcp198-1537926187.warc.gz
data/manual-annotations/archived-raw-serps/warcs/linkedin-cryptocurrencies-1556702372.warc.gz
data/manual-annotations/archived-raw-serps/warcs/linkedin-g-d-goenka-international-school-surat-wisdom-valley-campus-nr-anuvrat-dwar-new-city-light-road-rcc-canal-road-bar-surat-gujrat-1568400864.warc.gz
data/manual-annotations/archived-raw-serps/warcs/linkedin-james-margolin-fbi-1571382052.warc.gz
data/manual-annotations/archived-raw-serps/warcs/linkedin-parent-information-center-of-nj-https-www-linkedin-com-feed-1537815970.warc.gz
data/manual-annotations/archived-raw-serps/warcs/linkedin-parent-information-center-of-nj-https-www-linkedin-com-search-results-all-keywords-parent-information-center-of-nj-1537815969.warc.gz
data/manual-annotations/archived-raw-serps/warcs/linkedin-test-1563279735.warc.gz
data/manual-annotations/archived-raw-serps/warcs/linkedin-vizthink-1229875736.warc.gz
data/manual-annotations/archived-raw-serps/warcs/manual-google-1.warc.gz
data/manual-annotations/archived-raw-serps/warcs/manual-google-2.warc.gz
data/manual-annotations/archived-raw-serps/warcs/naver-10559239-974530320.warc.gz
data/manual-annotations/archived-raw-serps/warcs/naver-11548566-973003263.warc.gz
data/manual-annotations/archived-raw-serps/warcs/naver-dpsxmfl-1632292908.warc.gz
data/manual-annotations/archived-raw-serps/warcs/naver-geobugseon-1439284748.warc.gz
data/manual-annotations/archived-raw-serps/warcs/naver-heolkeu-dari-gajin-namja-1397449417.warc.gz
data/manual-annotations/archived-raw-serps/warcs/naver-junggangosagongbu-1627424756.warc.gz
data/manual-annotations/archived-raw-serps/warcs/naver-monteria-montheria-bunyupoteu-jeongitipoteu-jeongijujeonja-bunyupoteugi-1200ml-1200mlpingkeu-hugi-1640713881.warc.gz
data/manual-annotations/archived-raw-serps/warcs/naver-sejongmunhwahoegwan-daegeugjang-1652993423.warc.gz
data/manual-annotations/archived-raw-serps/warcs/naver-t-1047137339.warc.gz
data/manual-annotations/archived-raw-serps/warcs/naver-z-974687640.warc.gz
data/manual-annotations/archived-raw-serps/warcs/pornhub-12-1565436858.warc.gz
data/manual-annotations/archived-raw-serps/warcs/pornhub-brazilian-carnival-1378864891.warc.gz
data/manual-annotations/archived-raw-serps/warcs/pornhub-cfnm2-1271707129.warc.gz
data/manual-annotations/archived-raw-serps/warcs/pornhub-full-porno-films-1633148146.warc.gz
data/manual-annotations/archived-raw-serps/warcs/pornhub-kardashian-1232246712.warc.gz
data/manual-annotations/archived-raw-serps/warcs/pornhub-mini-skirt-1257166127.warc.gz
data/manual-annotations/archived-raw-serps/warcs/pornhub-org-1219567054.warc.gz
data/manual-annotations/archived-raw-serps/warcs/pornhub-roxy-reynolds-1222496976.warc.gz
data/manual-annotations/archived-raw-serps/warcs/pornhub-stripping-1627962626.warc.gz
data/manual-annotations/archived-raw-serps/warcs/pornhub-teen-facial-1237526884.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-danil-kozlovsky-1360453772.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-erin-1359911760.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-feng-mi-lian-1380895166.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-hua-ze-xiang-cai-1408309927.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-james-boshier-1449178049.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-ji-lin-yan-ji-1360789033.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-ji-zhou-dao-ttglao-hu-ji-ping-tai-guan-wang-x-fa33n-comx-1488991663.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-jie-ke-luo-de-wei-er-1445892389.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-jin-cheng-wu-1319745059.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-jin-xiu-long-1320298924.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-lin-xi-tong-1507483207.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-niamh-cusack-1319751306.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-shen-shan-zheng-er-lang-1405119212.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-statue-1536122094.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-tag-encode-1341871817.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-turn-that-finger-around-1324266860.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-xing-xing-di-qiu-2-1582812539.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-zhang-dong-jian-1446133153.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qq-zhong-nian-wei-ji-1408289827.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-administrateur-general-du-cnam-1619206522.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-allades-1631959376.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-anna-sottilotta-1630417705.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-another-word-for-less-likely-1641721403.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-attaque-a-tunis-1433356632.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-bluestacks-keyboard-not-working-1637463746.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-celine-de-roany-1640557696.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-code-9-1661507082.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-danse-1460250714.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-david-shepard-restaurateur-de-film-1595246740.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-dr-heim-tampa-1631748962.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-dr-michael-valliere-1653406352.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-drapeau-canadien-1615473541.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-eric-singer-drums-1621083357.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-festival-corazon-latino-1644332358.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-fredrik-lundberg-1665847606.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-geographie-de-la-france-1620931197.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-great-falls-gun-club-1637348184.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-guerre-froide-1654846351.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-hovelhof-1461470750.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-i-squared-capital-linkedin-1653657436.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-initialiser-debat-dadmissibilite-1645273237.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-jesus-mendez-facebook-1642962807.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-journee-nationale-du-drapeau-gabonais-1628405454.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-lemke-software-gmbh-1625227146.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-lombocruralgie-francais-1656441384.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-marcel-caya-1628794563.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-metal-slug-foo-1624572900.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-musique-folklorique-bretonne-1631820741.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-neonazis-en-france-1663085614.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-obs-keyframe-interval-1657322209.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-ouat-once-upon-a-train-1643380520.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-phantasialand-1461344566.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-que-tal-magazine-1643474954.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-rmvmn-1619293679.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-rob-diamond-movies-1626693763.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-rosa-linux-1664389965.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-sacred-age-odysseria-1652523638.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-skerdi-dervishaj-1635917093.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-sporting-stadium-1640362241.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-steam-ubuntu-wiki-1592725715.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-the-owl-club-1666374443.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-toddlercon-1579361594.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-trouve-arc-bf4-1625314405.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-tv-horror-movies-chart-1667140806.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-unification-album-1626264528.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-victoria-zdrok-1632510384.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-volt-bulgarie-1628499772.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-what-is-beowulf-about-summary-1659304409.warc.gz
data/manual-annotations/archived-raw-serps/warcs/qwant-world-deutsch-regional-europa-deutschland-baden-wurttemberg-landkreise-heilbronn-stadte-und-gemeinde-1626329085.warc.gz
data/manual-annotations/archived-raw-serps/warcs/reddit-3ds-1364668924.warc.gz
data/manual-annotations/archived-raw-serps/warcs/reddit-b7-1650853917.warc.gz
data/manual-annotations/archived-raw-serps/warcs/reddit-flair-already-posted-https-redd-it-xamfzl-1667030236.warc.gz
data/manual-annotations/archived-raw-serps/warcs/reddit-german-nebelmittelwurfanlage-1664557458.warc.gz
data/manual-annotations/archived-raw-serps/warcs/reddit-how-can-i-access-nature-com-articles-1666041985.warc.gz
data/manual-annotations/archived-raw-serps/warcs/reddit-jailbait-1376244913.warc.gz
data/manual-annotations/archived-raw-serps/warcs/reddit-supermoon-1403887175.warc.gz
data/manual-annotations/archived-raw-serps/warcs/reddit-teleperformance-1260472045.warc.gz
data/manual-annotations/archived-raw-serps/warcs/reddit-touch-meme-1663170731.warc.gz
data/manual-annotations/archived-raw-serps/warcs/reddit-typetest-10fastfingers-1663797626.warc.gz
data/manual-annotations/archived-raw-serps/warcs/roblox-build-to-survive-black-people-1663785067.warc.gz
data/manual-annotations/archived-raw-serps/warcs/roblox-chernobyl-rp-1666555966.warc.gz
data/manual-annotations/archived-raw-serps/warcs/roblox-cut-1633682743.warc.gz
data/manual-annotations/archived-raw-serps/warcs/roblox-shorts-1357668619.warc.gz
data/manual-annotations/archived-raw-serps/warcs/roblox-soviet-union-1657601847.warc.gz
data/manual-annotations/archived-raw-serps/warcs/roblox-survival-1656759229.warc.gz
data/manual-annotations/archived-raw-serps/warcs/roblox-survive-the-killer-1640549700.warc.gz
data/manual-annotations/archived-raw-serps/warcs/roblox-welcome-to-the-town-of-robloxia-uncopylocked-1660007534.warc.gz
data/manual-annotations/archived-raw-serps/warcs/roblox-xo-so-88-gg8-run-1659417607.warc.gz
data/manual-annotations/archived-raw-serps/warcs/roblox-znation8000-1650350926.warc.gz
data/manual-annotations/archived-raw-serps/warcs/sogou-cesuk-163163163-cn-1493482889.warc.gz
data/manual-annotations/archived-raw-serps/warcs/sogou-eed-1-4a1-a-1332923188.warc.gz
data/manual-annotations/archived-raw-serps/warcs/sogou-j-1341637724.warc.gz
data/manual-annotations/archived-raw-serps/warcs/sogou-ju-min-shen-fen-zheng-hao-ma-he-xing-ming-1508756794.warc.gz
data/manual-annotations/archived-raw-serps/warcs/sogou-l-1346233371.warc.gz
data/manual-annotations/archived-raw-serps/warcs/sogou-lofke-yi-kua-shi-chang-mai-mai-1333092705.warc.gz
data/manual-annotations/archived-raw-serps/warcs/sogou-ti-gong-jin-kou-qi-qiang-1647324224.warc.gz
data/manual-annotations/archived-raw-serps/warcs/sogou-tu-guan-xin-gai-kuan-1332227339.warc.gz
data/manual-annotations/archived-raw-serps/warcs/sogou-xing-ai-ji-qiao-1576522689.warc.gz
data/manual-annotations/archived-raw-serps/warcs/sogou-yuan-dai-ma-xie-lu-1578201651.warc.gz
data/manual-annotations/archived-raw-serps/warcs/stackoverflow-fonts-swing-jtextpane-1412916125.warc.gz
data/manual-annotations/archived-raw-serps/warcs/stackoverflow-numpy-einsum-1516773912.warc.gz
data/manual-annotations/archived-raw-serps/warcs/stackoverflow-objective-c-1354546520.warc.gz
data/manual-annotations/archived-raw-serps/warcs/stackoverflow-remote-execution-1645839151.warc.gz
data/manual-annotations/archived-raw-serps/warcs/stackoverflow-ruby-1-9-3-heroku-1398351399.warc.gz
data/manual-annotations/archived-raw-serps/warcs/stackoverflow-ruby-on-rails-plugins-1613971498.warc.gz
data/manual-annotations/archived-raw-serps/warcs/stackoverflow-scala-1355718931.warc.gz
data/manual-annotations/archived-raw-serps/warcs/stackoverflow-text-mining-1522322354.warc.gz
data/manual-annotations/archived-raw-serps/warcs/stackoverflow-vue-js-php-1647710017.warc.gz
data/manual-annotations/archived-raw-serps/warcs/stackoverflow-xampp-java-1547581001.warc.gz
data/manual-annotations/archived-raw-serps/warcs/tribunnews-linkid-js-1533168227.warc.gz
data/manual-annotations/archived-raw-serps/warcs/tribunnews-peringatan-dini-bmkg-kamis-18-februari-2021-1632679908.warc.gz
data/manual-annotations/archived-raw-serps/warcs/tribunnews-pilgub-dki-jakarta-2017-1491952670.warc.gz
data/manual-annotations/archived-raw-serps/warcs/tribunnews-polsek-tallo-1663047668.warc.gz
data/manual-annotations/archived-raw-serps/warcs/tribunnews-ricky-natapradja-1663049121.warc.gz
data/manual-annotations/archived-raw-serps/warcs/tribunnews-search-term-string-1607106977.warc.gz
data/manual-annotations/archived-raw-serps/warcs/tribunnews-search-term-string-1607120098.warc.gz
data/manual-annotations/archived-raw-serps/warcs/tribunnews-search-term-string-1607130238.warc.gz
data/manual-annotations/archived-raw-serps/warcs/tribunnews-search-term-string-1607224881.warc.gz
data/manual-annotations/archived-raw-serps/warcs/tribunnews-search-term-string-1607225592.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitch-a-plague-tale-innocence-1638358324.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitch-central-fluminense-1630540704.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitch-cpentagon-1640060311.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitch-juliversal-1629750531.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitch-rubberboy2001-1661349876.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitch-simplevar-1662753027.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitch-xxlillythefallenangelneko-1638019769.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitter-campaigns-1481768285.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitter-clubs-lang-sr-1591413117.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitter-ecotourism-1557315321.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitter-freemariabutina-1555124003.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitter-freemariabutina-1562498575.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitter-freemariabutina-1563062689.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitter-http-shop-pre-com-corona02-p-409033-1648579256.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitter-lauramajor-1652839406.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitter-rabble-ca-lang-ar-1442999332.warc.gz
data/manual-annotations/archived-raw-serps/warcs/twitter-rabble-ca-lang-fr-lang-id-1443046297.warc.gz
data/manual-annotations/archived-raw-serps/warcs/vk-000-space-marine-1363614912.warc.gz
data/manual-annotations/archived-raw-serps/warcs/vk-grot-1353834377.warc.gz
data/manual-annotations/archived-raw-serps/warcs/vk-gta-1389323282.warc.gz
data/manual-annotations/archived-raw-serps/warcs/vk-imperatory-illiuzii-1387125239.warc.gz
data/manual-annotations/archived-raw-serps/warcs/vk-loco-roco-1377325114.warc.gz
data/manual-annotations/archived-raw-serps/warcs/vk-muzyka-1372304839.warc.gz
data/manual-annotations/archived-raw-serps/warcs/vk-rabotaiu-na-sebia-1361533546.warc.gz
data/manual-annotations/archived-raw-serps/warcs/vk-radioelektronnye-sistemy-1361402773.warc.gz
data/manual-annotations/archived-raw-serps/warcs/vk-sportivnye-mototsikly-1387080107.warc.gz
data/manual-annotations/archived-raw-serps/warcs/vk-technology-1383988940.warc.gz
data/manual-annotations/archived-raw-serps/warcs/weibo-bu-xiang-jiao-hun-li-de-fen-zi-qian-refer-focus-lx-stopic-box-1527256388.warc.gz
data/manual-annotations/archived-raw-serps/warcs/weibo-fu-cai-3dshu-ju-jia-wei-xin-xw639-2018-1555261848.warc.gz
data/manual-annotations/archived-raw-serps/warcs/weibo-hun-li-li-jie-refer-stopic-box-1505917853.warc.gz
data/manual-annotations/archived-raw-serps/warcs/weibo-ji-huo-ma-b-1-page-2-1433297692.warc.gz
data/manual-annotations/archived-raw-serps/warcs/weibo-kan-bu-jian-de-yan-pi-1409920649.warc.gz
data/manual-annotations/archived-raw-serps/warcs/weibo-li-wei-yi-refer-user-weibo-1517733046.warc.gz
data/manual-annotations/archived-raw-serps/warcs/weibo-meng-lin-dexiao-wu-1437753277.warc.gz
data/manual-annotations/archived-raw-serps/warcs/weibo-quan-ye-cha-page-13-1517932436.warc.gz
data/manual-annotations/archived-raw-serps/warcs/weibo-sheng-fu-lang-xi-si-1603546157.warc.gz
data/manual-annotations/archived-raw-serps/warcs/weibo-xiao-xiao-bin-refer-stopic-box-1518290095.warc.gz
data/manual-annotations/archived-raw-serps/warcs/wikimedia-ao-xian-yu-le-du-bo-ping-tai-1430758639.warc.gz
data/manual-annotations/archived-raw-serps/warcs/wikimedia-figures-in-theatrical-costumes-claude-gillot-1673-1722-class-photo-description-french-painter-drawer-1632572254.warc.gz
data/manual-annotations/archived-raw-serps/warcs/wikimedia-group-portrait-on-doorstep-collins-tudor-washington-1898-1970-photographer-75426-object-number-haswb-1629837781.warc.gz
data/manual-annotations/archived-raw-serps/warcs/wikimedia-la-dian-zi-ji-1517046182.warc.gz
data/manual-annotations/archived-raw-serps/warcs/wikimedia-mou-lin-han-site-pku-edu-cn-1576868395.warc.gz
data/manual-annotations/archived-raw-serps/warcs/wikimedia-nito-1655733503.warc.gz
data/manual-annotations/archived-raw-serps/warcs/wikimedia-oxygen-1596274448.warc.gz
data/manual-annotations/archived-raw-serps/warcs/wikimedia-prob-1543207125.warc.gz
data/manual-annotations/archived-raw-serps/warcs/wikimedia-recaptchalogo-svg-1509131182.warc.gz
data/manual-annotations/archived-raw-serps/warcs/wikimedia-zao-can-bao-zi-jia-meng-www-baidu-com-aaaa-4ws-2018nian-8yue-4ri-21shi-19fen-39miao-1537939782.warc.gz
data/manual-annotations/archived-raw-serps/warcs/xvideos-casey-cavert-go-to-www-lovesbo-ru-1642784433.warc.gz
data/manual-annotations/archived-raw-serps/warcs/xvideos-claire-dames-1325320932.warc.gz
data/manual-annotations/archived-raw-serps/warcs/xvideos-drunk-1325431509.warc.gz
data/manual-annotations/archived-raw-serps/warcs/xvideos-escola-sao-luis-1657929903.warc.gz
data/manual-annotations/archived-raw-serps/warcs/xvideos-evander-marius-go-to-www-lovesbo-ru-1642716634.warc.gz
data/manual-annotations/archived-raw-serps/warcs/xvideos-free-hardcore-porn-videos-japanese-video-1428541087.warc.gz
data/manual-annotations/archived-raw-serps/warcs/xvideos-gay-peeing-porn-go-to-www-lovesbo-ru-1643357466.warc.gz
data/manual-annotations/archived-raw-serps/warcs/xvideos-gay-whitezilla-go-to-www-lovesbo-ru-1643416941.warc.gz
data/manual-annotations/archived-raw-serps/warcs/xvideos-robber-1248193170.warc.gz
data/manual-annotations/archived-raw-serps/warcs/xvideos-solo-1341894522.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-ashland-oregon-1015423512.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-bc-gov-971492707.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-bill-callahan-american-football-1636808341.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-castle-heights-angeles-1611631735.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-civil-code-1658358754.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-dating-sites-1647656764.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-diver-lg-u8180-1620023310.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-dunwells-army-of-friends-1617218301.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-envious-that-biden-1652739375.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-every-previewsworld-calls-1649106369.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-free-mail-centers-970285370.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-free-nude-pics-of-brittney-spears-970473571.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-free-pics-bbbw-1041625676.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-free-xxx-asian-pics-952102259.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-freeware-936293306.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-fresh-prince-of-bel-air-971413040.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-frugal-994624570.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-fruitarianism-970289154.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-full-speed-1011203807.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-funny-970842855.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-funny-pictures-943791338.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-futurama-1314932107.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-future-of-sport-971016077.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-gabel-970409689.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-gaelic-970435492.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-gamefaq-970449707.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-games-970945905.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-games-puzzles-brain-teasers-sudoku-1574052323.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-games-video-games-developers-and-publishers-croteam-1624838167.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-gamespot-portugal-1036145291.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-gaming-club-997142327.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-ganze-filme-online-schauen-kostenlos-und-in-voller-lange-1376615487.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-gay-shower-sex-961542771.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-gender-discrimination-970694307.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-general-s-daughter-the-970749419.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-genserv-971364933.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-george-foreman-boxer-1040476713.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-georgetown-university-law-center-970779220.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-georgia-restaurant-association-970314665.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-german-pen-pals-961119166.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-ghar-1005251824.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-ghulam-sarwar-khan-1626337646.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-gina-mckee-998889511.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-girlsandanimals-1039016411.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-glass-tools-961515348.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-global-and-parts-970542388.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-goddess-955975798.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-gogi-grant-1041483222.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-golden-books-971368161.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-golf-poll-971193897.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-golson-1017320115.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-gordon-bruce-955082521.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-govote-com-955100292.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-hombres-con-pelo-en-el-pecho-photos-1359853955.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-isnt-even-weirdest-thing-america-right-1653343893.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-jello-gelatin-971145484.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-john-mccain-956454509.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-lawyer-career-information-970996615.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-learn-to-focus-1619373855.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-lm-1376048795.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-mark-schlissel-wife-1642367070.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-metallurgi-1042532635.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-molly-shannon-1640079691.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-region-de-coquimbo-970960857.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-sam-bush-1016625678.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-telekwiaciarnia-pl-1436841282.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-trans-texas-corridor-1613259804.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-wheatstone-bridge-1613009822.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-world-greek-kata-periokhe-boreia-amerike-kanadas-1647085990.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yahoo-world-hebrew-hbrh-shlvm-1489427128.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yandex-danses-tv-periodic-1534841786.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yandex-niusha-1515577404.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yandex-speed-force-1535895408.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yandex-speed-force-1535955246.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yandex-speed-force-1535970436.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yandex-speed-force-1535973684.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yandex-speed-force-1536042339.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yandex-speed-force-1536100368.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yandex-spirited-away-animated-film-2001-1524478207.warc.gz
data/manual-annotations/archived-raw-serps/warcs/yandex-virat-swaroop-1523992633.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-ampatuanmassacre-1583309425.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-cardistry-asmr-1577113546.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-chto-budet-esli-sobrat-vse-rezinki-v-bully-1599555287.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-hp-probook-640-g1-razborka-1579996098.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-kak-sdelat-vzryv-v-cinema-4d-1578732009.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-kak-vybit-dushu-moba-1599057231.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-kutyaplya-1561171748.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-lataji-1563086980.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-literatura-6-klass-biografiia-pushkina-1595705363.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-ne-prosto-bekkhen-reaktsiia-1582514079.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-pora-tiulpanov-aktery-1574991226.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-prokhozhdenie-igry-madagaskar-2-chast-4-1562167916.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-pudding-1563068696.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-q2-2017-arizona-west-regional-1547871680.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-razbor-shchetki-pylesosa-samsung-1584184489.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-robloks-mip-siti-2019-1583715307.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-shang-yue-xian-rupu-1582390054.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-uzbekskaia-svadba-v-shymkente-1574145605.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-vasilii-emelianenko-tefteli-1578285143.warc.gz
data/manual-annotations/archived-raw-serps/warcs/youtube-zadnii-most-moskvich-412-ustroistvo-1584150216.warc.gz
docs/queries-tsne-teaser.png
docs/queries-tsne.png
helm/archive-query-log/.gitignore
helm/archive-query-log/.helmignore
helm/archive-query-log/Chart.yaml
helm/archive-query-log/values.yaml
helm/archive-query-log/templates/NOTES.txt
helm/archive-query-log/templates/archive-query-log-config-map.yml
helm/archive-query-log/templates/archive-query-log-cron-job-captures-fetch.yml
helm/archive-query-log/templates/archive-query-log-cron-job-captures-import-aql-22.yml
helm/archive-query-log/templates/archive-query-log-cron-job-serps-download-warc.yml
helm/archive-query-log/templates/archive-query-log-cron-job-serps-parse-url-offset.yml
helm/archive-query-log/templates/archive-query-log-cron-job-serps-parse-url-page.yml
helm/archive-query-log/templates/archive-query-log-cron-job-serps-parse-url-query.yml
helm/archive-query-log/templates/archive-query-log-cron-job-serps-parse-warc-query.yml
helm/archive-query-log/templates/archive-query-log-cron-job-serps-parse-warc-snippets.yml
helm/archive-query-log/templates/archive-query-log-cron-job-sources-build.yml
helm/archive-query-log/templates/archive-query-log-deployment-monitoring.yml
helm/archive-query-log/templates/archive-query-log-ingress-monitoring.yml
helm/archive-query-log/templates/archive-query-log-secret.yaml
helm/archive-query-log/templates/archive-query-log-service-monitoring.yml
integrations/ir_datasets/Dockerfile
integrations/ir_datasets/Makefile
integrations/ir_datasets/README.md
integrations/ir_datasets/archive_query_log_ir_datasets_integration.py
integrations/ir_datasets/data/results/part-00000.gz
integrations/ir_datasets/data/serps/part-00000.gz
integrations/tira/.gitignore
integrations/tira/Dockerfile
integrations/tira/README.md
integrations/tira/aql-experiment-baseline.py
integrations/tira/validation-data/results/part-00000.gz
integrations/tira/validation-data/serps/part-00000.gz
notebooks/.gitignore
notebooks/Makefile
notebooks/calculate-sbert-embeddings.ipynb
notebooks/evaluation_corpus_fields.ipynb
notebooks/evaluation_most_referenced_domains.ipynb
notebooks/evaluation_query_length.ipynb
notebooks/evaluation_results_per_serp.ipynb
notebooks/evaluation_services_overview.ipynb
notebooks/evaluation_time_series.ipynb
notebooks/evaluation_trec_overlap.ipynb
notebooks/evaluation_us_election.ipynb
notebooks/example_corpus_parquet.ipynb
notebooks/obscene_queries.ipynb
notebooks/obscene_words.json
notebooks/pornographic_queries.ipynb
notebooks/process_corpus.ipynb
notebooks/process_stats.ipynb
notebooks/services.txt
notebooks/figures/.gitignore
scripts/create_corpus.py
scripts/create_corpus.sh
scripts/download_corpus.sh