[
    {
        "text": "You should open your own Breakfast-Diner. I would be your everyday-guest, even If I had to move away from germany for that :D\nmums mums mums!\nIvy: Hahaha! Good idea. :)Melwa: :)\nSkicka en kommentar",
        "meta": {
            "lang": "en",
            "lang_score": 0.8643032908439636,
            "url": "http://365daysofbreakfast.blogspot.com/2011/07/monday.html",
            "timestamp": "2023-11-28T09:40:02Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.05521472392638037
                ],
                [
                    3,
                    0.07975460122699386
                ],
                [
                    4,
                    0.10429447852760736
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 35,
            "mean_word_length": 4.6571428571428575,
            "num_of_sentences": 5,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9714285714285714,
            "num_of_stop_words": 3,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Episode 20: Chris Guzikowski, Executive Editor, Pearson\nIn this episode of AgileNEXT, Chris Guzikowski joins Daniel and Stephen and takes us inside the sausage factory: showing us how a book is made and how you can get published. Some topics include: The Agile Book market and what the future looks like for publishing How to get published Career Development The Agile Community His time [\u2026]",
        "meta": {
            "lang": "en",
            "lang_score": 0.9383002519607544,
            "url": "http://agilenext.tv/tag/chris-guzikowski/",
            "timestamp": "2023-11-28T10:16:09Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.04892966360856269
                ],
                [
                    3,
                    0.045871559633027525
                ],
                [
                    4,
                    0.07951070336391437
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.5,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 65,
            "mean_word_length": 5.030769230769231,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.015384615384615385,
            "fraction_of_words_with_alpha_character": 0.9692307692307692,
            "num_of_stop_words": 13,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Save my name, email, and website in this browser for the next time I comment.\n\u00a9 2023 Victoria Bakes.\nAll rights reserved. Web Design by Hello Pomelo.",
        "meta": {
            "lang": "en",
            "lang_score": 0.8880177736282349,
            "url": "http://bakingintotheether.com/2016/05/23/sugar-donuts/img_2916/",
            "timestamp": "2023-11-28T09:01:29Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.04878048780487805
                ],
                [
                    3,
                    0.08943089430894309
                ],
                [
                    4,
                    0.13821138211382114
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 27,
            "mean_word_length": 4.555555555555555,
            "num_of_sentences": 4,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9259259259259259,
            "num_of_stop_words": 3,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "- Wandering Souls: Journeys with the Dead and Living in Vietnam; Karlin (paperbackswap)\n- Outside Boy; Cummins (paperbackswap)\n- My Name is Mary Sutter; Oliveira (Viking)\n- Scent of the Missing; Charleson (paperbackswap)\n- Never Wave Goodbye; Magee (Touchstone)\n- Every House Needs a Balcony; Frank (Harper)\n- The Bucolic Plague; Kilmer Purcell (Harper Collins)\n- Broke USA; Rivlin (Harper Collins)\n- Based on Availability; Strauss (Harper Collins)\n- October Suite; Clair\n- Blind Side of the Heart; White\n- All We Ever Wanted Was Everything; Brown\n- Lush Life; Price\n- Downhill Chance; Morrissey\n- Forsyte Saga; Galsworthy\n- A Reliable Wife; Goolrick",
        "meta": {
            "lang": "en",
            "lang_score": 0.687304675579071,
            "url": "http://bibliophilebythesea.blogspot.com/2010/06/mailbox-monday.html",
            "timestamp": "2023-11-28T08:43:44Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.08775137111517367
                ],
                [
                    3,
                    0.08775137111517367
                ],
                [
                    4,
                    0.043875685557586835
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 1.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 104,
            "mean_word_length": 5.259615384615385,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.8461538461538461,
            "num_of_stop_words": 11,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "site map\nRooftop decks with 3600 views of Downtown,\nCamelback Mountain & Piestewa Peak\n3 bedrooms / 3 baths\n1,600-1,950 sq. ft.\n2 car garage\nGated entry\nCommunity pool & spa\nBiltmore/Arcadia area\nminutes to Biltmore Fashion Park,\nCamelback Corridor, La Grande Orange\nImmediate delivery\nLocated at 35th Street & Pinchot Ave (one block north of Thomas, one\nblock west of 36th Street see\nEmail: info@cosmohomes.com\nWeb design: Web-Writer,",
        "meta": {
            "lang": "en",
            "lang_score": 0.8029668927192688,
            "url": "http://brownstonesquare.com/?i=387-388-1",
            "timestamp": "2023-11-28T09:22:37Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.01907356948228883
                ],
                [
                    3,
                    0.03814713896457766
                ],
                [
                    4,
                    0.051771117166212535
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.028169014084507043,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 69,
            "mean_word_length": 5.318840579710145,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.8695652173913043,
            "num_of_stop_words": 9,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Month: September 2019\n2 Things To Consider Before Accepting A Job Offer\nYou spend several days to write an impressive resume. You mailed it to several companies and now you are patiently waiting for their response. After\u2026\nTips for choosing the Right School for your Child\nSo, your child has finally reached the school-going age? Well, that is good news. Did you know that the type of school you choose for\u2026\nDoes neurofeedback help people with ADHD? Find out here\nSadly, Attention Deficit Hyperactivity Disorder or ADHD affects a lot of people around the world. They usually lose their impulse control, their attention is always\u2026",
        "meta": {
            "lang": "en",
            "lang_score": 0.9607195258140564,
            "url": "http://cadcamperformance.com/2019/09",
            "timestamp": "2023-11-28T09:49:03Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.03435114503816794
                ],
                [
                    3,
                    0.03625954198473282
                ],
                [
                    4,
                    0.03816793893129771
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.42857142857142855,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 105,
            "mean_word_length": 4.9904761904761905,
            "num_of_sentences": 7,
            "symbol_to_word_ratio": 0.02857142857142857,
            "fraction_of_words_with_alpha_character": 0.9809523809523809,
            "num_of_stop_words": 21,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Whitelabel Error Page\nThis application has no explicit mapping for /error, so you are seeing this as a fallback.\nTue Nov 28 17:43:18 KST 2023\nThere was an unexpected error (type=Internal Server Error, status=500).\nUnable to find ezmeta.wqikan.domain.Issue with id 863417",
        "meta": {
            "lang": "en",
            "lang_score": 0.8595819473266602,
            "url": "http://caj.ezmeta.co.kr:8080/cajkor/article/00034461935",
            "timestamp": "2023-11-28T08:43:18Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.06521739130434782
                ],
                [
                    3,
                    0.08260869565217391
                ],
                [
                    4,
                    0.1
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 41,
            "mean_word_length": 5.609756097560975,
            "num_of_sentences": 3,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9024390243902439,
            "num_of_stop_words": 4,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Factors to look at when in the search of the best Pet Sitting services In order to get access to the best Pet Sitting services in the flooded Market it is advisable that the client take their precious time to survey n evaluate the market trends 2ell. In this process [\u2026]\nFinding Parallels Between and Life\nCrafting an Exceptional Online Presence with Website Design Bournemouth Website design is an intricate fusion of creativity and technical precision, molding a platform that conveys your message with finesse and functionality. Within the vibrant confines of Bournemouth, this art form ascends to unparalleled heights, turning ordinary websites into captivating, immersive [\u2026]\n5 Key Takeaways on the Road to Dominating\nAn Overview to Picking the Right Family Law Office When confronted with lawful matters associated with family members issues, such as separation, child wardship, or adoption, it can be discouraging to browse the complex lawful system alone. Working with a trusted household law office can provide you with the experience [\u2026]",
        "meta": {
            "lang": "en",
            "lang_score": 0.9117600321769714,
            "url": "http://cfavbms.info/category/internet-services/",
            "timestamp": "2023-11-28T09:13:55Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.011337868480725623
                ],
                [
                    3,
                    0.022675736961451247
                ],
                [
                    4,
                    0.03854875283446712
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.030612244897959183
                ],
                [
                    6,
                    0.030612244897959183
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.6,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 166,
            "mean_word_length": 5.313253012048193,
            "num_of_sentences": 4,
            "symbol_to_word_ratio": 0.018072289156626505,
            "fraction_of_words_with_alpha_character": 0.9759036144578314,
            "num_of_stop_words": 44,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "\u20b9699.00 \u20b9549.00\nThere are no reviews yet.\nYour email address will not be published. Required fields are marked *\nYour review *\nName *\nEmail *\nSave my name, email, and website in this browser for the next time I comment.",
        "meta": {
            "lang": "en",
            "lang_score": 0.9087914228439331,
            "url": "http://crazyybakers.com/product/chocolate-truffle-cake/",
            "timestamp": "2023-11-28T09:17:09Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.0782122905027933
                ],
                [
                    3,
                    0.10614525139664804
                ],
                [
                    4,
                    0.12290502793296089
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 41,
            "mean_word_length": 4.365853658536586,
            "num_of_sentences": 3,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.8536585365853658,
            "num_of_stop_words": 4,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "About Us\nOur Services\nBurial or Graveside Services\nCremation Services\nMemorial Services\nFuneral Planning\nFuneral Pre-Planning\nGrief & Guidance\nGrief Support\nUse the form above to find your loved one. You can search using the name of your loved one, or any family name for current or past services entrusted to our firm.Click here to view all obituaries",
        "meta": {
            "lang": "en",
            "lang_score": 0.7833401560783386,
            "url": "http://crgamble.frontrunnerpro.com/book-of-memories/3619352/Gillan-Ted/service-details.php",
            "timestamp": "2023-11-28T08:39:09Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.061016949152542375
                ],
                [
                    3,
                    0.03389830508474576
                ],
                [
                    4,
                    0.061016949152542375
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.01694915254237288,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 58,
            "mean_word_length": 5.086206896551724,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9827586206896551,
            "num_of_stop_words": 6,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Dennis Burnett Photography, Austin Texas Editorial, Commercial, Lifestyle, and Food photography\nCampaign: Dennis Burnett is an Austin, Texas based photographer who specializes in editorial, lifestyle and portrait photography: Successful Workout\n- New Work\n- Overview\n- Lifestyle\n- Food and Beverage\n- Corporate\n- Fitness\n- Industrial\n- Austin Makers\n- Campaign\n- Portraits\n- Editorial\n- Studio\n- Video\n- Private Galleries\n- About me\n- Contact\nDennis Burnett @ 2012 Austin Texas Commcerial, Lifestyle, and Editorial Photographer. Site design \u00a9 2010-2023 Neon Sky Creative Media",
        "meta": {
            "lang": "en",
            "lang_score": 0.79268479347229,
            "url": "http://dennisburnettphotography.com/campaign/campgladiator/Texas_Fitness_Sports_Lifestyle_Photographer_91",
            "timestamp": "2023-11-28T10:03:49Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.07959183673469387
                ],
                [
                    3,
                    0.05102040816326531
                ],
                [
                    4,
                    0.06326530612244897
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.8421052631578947,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 87,
            "mean_word_length": 5.632183908045977,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.7701149425287356,
            "num_of_stop_words": 14,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Powered by WordPress\nUsername or Email Address\nRemember Me\nLost your password?\n\u2190 Go to Detroit Santarchy\nPrivacy Policy\nBy proceeding you understand and give your consent that your IP address and browser information might be processed by the security plugins installed on this site.",
        "meta": {
            "lang": "en",
            "lang_score": 0.9227597117424011,
            "url": "http://detroitsantarchy.net/home/wp-login.php?redirect_to=http%3A%2F%2Fdetroitsantarchy.net%2Fhome%2Fwp-admin%2F&reauth=1",
            "timestamp": "2023-11-28T09:10:20Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.037815126050420166
                ],
                [
                    3,
                    0.07563025210084033
                ],
                [
                    4,
                    0.1092436974789916
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.021739130434782608,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 45,
            "mean_word_length": 5.288888888888889,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9777777777777777,
            "num_of_stop_words": 8,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "The iron bar is made of Q235A low carbon steel and galvanized, and wrapped with ABS plastic shell; the lock body is made of high-quality yuan steel cold forging with O-type or diamond shaped spring ring. Laser, hot stamping, digital, trademark, bar code can be used, the identification is clear and easy to read;\nApplications can be used in containers, trailers, tankers, shipping, railway transportation, logistics, freight, safe, lockers, etc",
        "meta": {
            "lang": "en",
            "lang_score": 0.898637056350708,
            "url": "http://dh-seals.com/h-pd-3.html",
            "timestamp": "2023-11-28T08:42:56Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.032
                ],
                [
                    3,
                    0.042666666666666665
                ],
                [
                    4,
                    0.032
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 70,
            "mean_word_length": 5.357142857142857,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 1.0,
            "num_of_stop_words": 13,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Under Knowledge you will find links to the newly produced bite-sized videos on CDIO Standards and Syllabus. Link to the videos Category: Blog posts on March 23, 2022 - 04:06 katel",
        "meta": {
            "lang": "en",
            "lang_score": 0.8957793116569519,
            "url": "http://ekrs.cdio.org/news/new-videos-cdio-standards-and-syllabus",
            "timestamp": "2023-11-28T10:06:10Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.06711409395973154
                ],
                [
                    3,
                    0.11409395973154363
                ],
                [
                    4,
                    0.14093959731543623
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 31,
            "mean_word_length": 4.806451612903226,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.8709677419354839,
            "num_of_stop_words": 6,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Important dates\nUntil April 19, 2021 registration of participants, filling out an application for a report, submission of abstracts\nUntil May 1, 2021 notification of the inclusion of the report in the program, invitation to participate in the conference\nUntil June 15, 2021 arrival confirmation, arrival information\nJuly 5, 2021 day of arrival\nJuly 9, 2021 departure day",
        "meta": {
            "lang": "en",
            "lang_score": 0.909961998462677,
            "url": "http://epps2021.itam.nsc.ru/en/imp_dates;jsessionid=C93F4FB7024FB108232340DB7DEAE193",
            "timestamp": "2023-11-28T09:13:17Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.03194888178913738
                ],
                [
                    3,
                    0.06070287539936102
                ],
                [
                    4,
                    0.07667731629392971
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 58,
            "mean_word_length": 5.396551724137931,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.8275862068965517,
            "num_of_stop_words": 10,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Issues of the Heart \u2013 Bitterness June 13, 2021 Brian Bitterness, Heart God looks at our hearts and out of them flow the issues of life, so we need to make sure our hearts are whole and healthy. This week, bitterness.",
        "meta": {
            "lang": "en",
            "lang_score": 0.9451563954353333,
            "url": "http://everynationtr.org/sermon-tag/bitterness/",
            "timestamp": "2023-11-28T10:31:58Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.09090909090909091
                ],
                [
                    3,
                    0.0625
                ],
                [
                    4,
                    0.09090909090909091
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 41,
            "mean_word_length": 4.2926829268292686,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.926829268292683,
            "num_of_stop_words": 9,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "You aren't allowed to view the forum statistics.\nPlease login below or register an account with .\nForgot your password?\nSubmit Headstamps",
        "meta": {
            "lang": "en",
            "lang_score": 0.8744357824325562,
            "url": "http://forum.afte.org/index.php?action=stats",
            "timestamp": "2023-11-28T10:49:57Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.07758620689655173
                ],
                [
                    3,
                    0.13793103448275862
                ],
                [
                    4,
                    0.15517241379310345
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 22,
            "mean_word_length": 5.2727272727272725,
            "num_of_sentences": 4,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9545454545454546,
            "num_of_stop_words": 4,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "http://blogs.zdnet.com/Spyware/?p=31 without digging round the www. too much on such a well worn subject just thought it worth a mention of some of the pitfalls of using filesharing apps many, infact most of them carry spyware adware and junk stuff in the installation so people out there just beware and do a little research before installing this type of program,this is as well as the legal side of people getting sued for thousand of dollars for downloading copyrighted files ie music films etc etc etc,is it worth it the choice is yours, read through past posts on kazaa and other filesharing apps for more detailed advice on the legal side of things,locustfurnace provided very detailed info on the legal aspects in many threads",
        "meta": {
            "lang": "en",
            "lang_score": 0.9173251986503601,
            "url": "http://forum.oldversion.com/showthread.php?2802-P2p-File-Sharing-Programs&s=1775d65d027ec384bfe6438dba9e479c&p=15152&viewfull=1",
            "timestamp": "2023-11-28T10:12:19Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.0392156862745098
                ],
                [
                    3,
                    0.0392156862745098
                ],
                [
                    4,
                    0.0457516339869281
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 123,
            "mean_word_length": 4.975609756097561,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 1.0,
            "num_of_stop_words": 26,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "The Buildings & Grounds ministry is responsible for the maintenance, upkeep, and oversight of our property, buildings and church van, with the assistance of the custodian and hired contractors and vendors.",
        "meta": {
            "lang": "en",
            "lang_score": 0.9532409906387329,
            "url": "http://fpcbainbridge.com/people/pat-thompson/",
            "timestamp": "2023-11-28T09:53:26Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.06857142857142857
                ],
                [
                    3,
                    0.07428571428571429
                ],
                [
                    4,
                    0.11428571428571428
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 31,
            "mean_word_length": 5.645161290322581,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.967741935483871,
            "num_of_stop_words": 13,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "For those of you who like to get all your ducks in a row from the start, there is a way to SAVE MONEYby ordering a bundle that includes your fitness program, your supplements, and a VIP club membership, along with free shipping on everything, for a much reduced rate.\nThis bundle is called a \u201cChallenge Pack\u201d \u2014 and there is a Challenge Pack available for nearly all of Beachbody\u2019s most popular workout programs. Click below for details on your program of choice =\n** There are also other Challenge Packs available for which I didn\u2019t dedicate a separate page, but you can learn more about them directly on TeamBeachbody by clicking the links below =\nAnd don\u2019t forget that along with getting your Challenge Pack, I encourage you to enter the Beachbody Challenge for your chance to CASH IN on your results!! Learn more here\n[...] Challenge Packs [...]\n[...] Challenge Packs [...]",
        "meta": {
            "lang": "en",
            "lang_score": 0.9367748498916626,
            "url": "http://getrippedathome.com/programs/challenge-packs/",
            "timestamp": "2023-11-28T10:52:58Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.16666666666666666,
            "fraction_of_characters_in_duplicate_lines": 0.03319502074688797,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.058091286307053944
                ],
                [
                    3,
                    0.022130013831258646
                ],
                [
                    4,
                    0.06639004149377593
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.3333333333333333,
            "fraction_of_lines_starting_with_bullet_point": 0.16666666666666666,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 154,
            "mean_word_length": 4.694805194805195,
            "num_of_sentences": 4,
            "symbol_to_word_ratio": 0.025974025974025976,
            "fraction_of_words_with_alpha_character": 0.948051948051948,
            "num_of_stop_words": 28,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Italy\u2019s Mediterranean Policy\n10 min read\nItaly is in a position, looking from a geographical and geostrategic point of view, to play one...\nElectronic Magazine On Global Politics, International Relations, History and World Security Since April 2014",
        "meta": {
            "lang": "en",
            "lang_score": 0.8607285618782043,
            "url": "http://global-politics.eu/tag/tripoli/",
            "timestamp": "2023-11-28T10:22:24Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.09433962264150944
                ],
                [
                    3,
                    0.12264150943396226
                ],
                [
                    4,
                    0.1320754716981132
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.25,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 37,
            "mean_word_length": 5.72972972972973,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.02702702702702703,
            "fraction_of_words_with_alpha_character": 0.9459459459459459,
            "num_of_stop_words": 5,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "A beautiful, relaxing and wondrous trip down the long and winding, rugged green west coast of Ireland will build your health and energy better than any medication. The west coast of Ireland is a great place to go to see amazing landscapes such as the huge flat topped mountain of Ben Bulben, verdant greenery, the [\u2026]",
        "meta": {
            "lang": "en",
            "lang_score": 0.9299318790435791,
            "url": "http://greatraveling.com/tag/surfing/",
            "timestamp": "2023-11-28T10:50:57Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.06870229007633588
                ],
                [
                    3,
                    0.08396946564885496
                ],
                [
                    4,
                    0.13740458015267176
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 1.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 56,
            "mean_word_length": 4.678571428571429,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.017857142857142856,
            "fraction_of_words_with_alpha_character": 0.9821428571428571,
            "num_of_stop_words": 20,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "<p>I have talked about [lk:fundable.org] here before. I have noe been a part of two failed funable.org campaigns. Granted one of them was aborted by the organizer early on, but the other was fairly modest (20 people x $12 for some bumper stickers). I just received notice that the campaign didn't meet its goal. So here are some problems i see with fundable right now</p> <ul> <li>There is NO WAY to revise a cmapaign once it starts and you must wait until the campaign fails (a month later) to end it. </li><li>There is no EASY way for a participant to contribute more than a single incremental contribution. Organizers should be able to set a contribution scale ($20, $50, $100, $250) </li><li>There is no AUTOMATED reminder that a campaign is coming to an end Basically every week there should be an update, with a link to notifyu more people about the funable campaign. So if the campaign is not meeting its goal, people who have already signed up can get informed in a passive way and choose to tell others to make a donation. </li><li>There is no way to scale back a goal. In many cases of group purchasing it is probably that you will know exactly what the item you want to buy costs, but what if you find one online for half the price (let say it is a pottery wheel, now instead of costing $1000 it costs $500), the organizer cannot revise the goal down to this new price, and if the $1000 goal is not met, the organizer has to start all over again. in the open source bounty scenario, a developer may offer to do the work far cheaper than originally estimated. </li><li>Matching campaigns: after starting a campaign, someone might discover it and decide that it is so worthy, they are willing to match other contributions (on a 1:1 or 2:1 basis) this could happen with philanthopic individuals or foundations, or individuals. But there is not way to accommodate this development <ul> <p>Basically fundable assumes that you have all your ducks in a row when you set out to create your campaign and that there will be no bumps in the road, nor posative changes in circumstances.</p> <p>These few small tweaks above could make fundable that much more useful of a tool.</p> </ul></li></ul>\nRecent Posts\nRecent Comments\n- February 2023\n- October 2021\n- September 2020\n- July 2020\n- February 2020\n- June 2019\n- November 2018\n- March 2017\n- November 2016\n- October 2016\n- August 2016\n- April 2016\n- March 2016\n- February 2016\n- August 2015\n- April 2015\n- March 2015\n- February 2015\n- April 2014\n- December 2013\n- November 2013\n- February 2012\n- January 2012\n- December 2011\n- November 2011\n- September 2011\n- May 2011\n- April 2011\n- March 2011\n- February 2011\n- January 2011\n- December 2010\n- November 2010\n- October 2010\n- September 2010\n- August 2010\n- July 2010\n- May 2010\n- April 2010\n- March 2010\n- February 2010\n- January 2010\n- December 2009\n- November 2009\n- October 2009\n- September 2009\n- August 2009\n- July 2009\n- June 2009\n- May 2009\n- April 2009\n- March 2009\n- February 2009\n- December 2008\n- November 2008\n- October 2008\n- September 2008\n- August 2008\n- July 2008\n- June 2008\n- May 2008\n- April 2008\n- March 2008\n- February 2008\n- January 2008\n- December 2007\n- November 2007\n- October 2007\n- September 2007\n- August 2007\n- July 2007\n- June 2007\n- May 2007\n- April 2007\n- March 2007\n- February 2007\n- January 2007\n- December 2006\n- November 2006\n- October 2006\n- September 2006\n- August 2006\n- July 2006\n- June 2006\n- May 2006\n- April 2006\n- March 2006\n- February 2006\n- January 2006\n- December 2005\n- November 2005\n- October 2005\n- September 2005\n- August 2005\n- July 2005\n- June 2005\n- May 2005\n- April 2005\n- March 2005\n- February 2005\n- January 1970",
        "meta": {
            "lang": "en",
            "lang_score": 0.9747705459594727,
            "url": "http://gregoryheller.com/2005/making-fundable-org-better/",
            "timestamp": "2023-11-28T10:33:14Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.036290322580645164
                ],
                [
                    3,
                    0.018145161290322582
                ],
                [
                    4,
                    0.006048387096774193
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0014388489208633094,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.9619047619047619,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 694,
            "mean_word_length": 4.2881844380403455,
            "num_of_sentences": 13,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.6930835734870316,
            "num_of_stop_words": 110,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Don't have an account? Register\nGX12 BOT allows you to shop from anywhere in the world.\nJoin our subscribers list to get the latest news, updates and special offers directly in your inbox\nLast added products",
        "meta": {
            "lang": "en",
            "lang_score": 0.8920621871948242,
            "url": "http://gx12bot.com/",
            "timestamp": "2023-11-28T08:49:12Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.05232558139534884
                ],
                [
                    3,
                    0.06395348837209303
                ],
                [
                    4,
                    0.11046511627906977
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.02702702702702703,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 36,
            "mean_word_length": 4.777777777777778,
            "num_of_sentences": 3,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 1.0,
            "num_of_stop_words": 8,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "autoclave container us manufacturer\nAug 23, 2018 // By:Jenny Wu // No Comment\nAutoclavable Containers, Autoclavable Containers Suppliers \u2026\nAutoclavable Containers, \u2026 Sterilizer / Sterilization Container Autoclave \u2026 delivery services Manufacturer and Exporter worldwide Surgical \u2026 Autoclavable Surgical Container, Autoclavable Surgical \u2026\nAutoclavable Surgical Container, Wholesale Various High Quality Autoclavable Surgical Container Products from Global Autoclavable Surgical Container Suppliers and Autoclavable Surgical Container Factory,Importer,Exporter at Alibaba.com. Autoclavable Plastic Containers at Thomas Scientific\nAutoclavable Plastic Containers found in: Polypropylene Wide Mouth Containers, Chemware Teflon\u00ae PFA Wide Mouth Jars, Tri-Stir Beakers, Cellulose Nitrate.. Autoclave Sterilizer, Autoclave Manufacturers, Wholesale \u2026\nExplore Autoclaves & Sterilizers \u2026 Portable Autoclave Portable Autoclave Our expertise enables us to manufacture and \u2026 as the reliable manufacturer and exporter \u2026\nAutoclave Container at Thomas Scientific Autoclave Container found in: Polycap TF PTFE Membrane Capsule Filters, Whatman Syringe Type Holders, Whatman Polydisc In-line Filters, TF, Scienceware\u00ae.. Bondtech \u2013 Medical Waste Autoclave and Composite Autoclave \u2026 Serving over 32 countries and counting, Bondtech has a proven record for international leadership in the autoclave industry. Sterilization container \u2013 All medical device manufacturers \u2026 Find your sterilization container easily \u2026 Duradex pans are compatible with washer and even autoclave \u2026 Contact the manufacturer to get an estimate \u2026 Pans and Trays \u2013 Containers | Sigma-Aldrich Sigma-Aldrich Online Catalog Product List: Pans and Trays High Volume Commercial Plants Hospital Installations High Volume Commercial Plants Hospital Installations \u2026 autoclave market and it has given us the respect of the industry. Bondtech is the largest manufacturer \u2026\nChina Class B Electric Digital Dental Autoclave Steam \u2026\nChina Class B Electric Digital Dental Autoclave Steam \u2026 Autoclave Equipment manufacturer / supplier \u2026 or e-mail to us regarding any technical or \u2026 China Autoclave suppliers, Autoclave manufacturers \u2026\nChina Autoclave suppliers \u2026 Verified Manufacturer \u2026 Come and meet us at the Fair! Register. Come and see our product at the Fair! Medical Autoclave \u2013 Medical Autoclave Manufacturers \u2026\nGet listings of medical autoclave, \u2026 and latest technical support help us in \u2026 in the industry as an eminent manufacturer and supplier of \u2026 Autoclaves \u2013 Manufacturers, Suppliers & Exporters in India\nContact verified Autoclaves Manufacturers, \u2026 The Cement Autoclave provided by us is suitable for \u2026 The company is a renowned Horizontal Autoclave Manufacturer, \u2026 Autoclavable Polypropylene Container at Thomas Scientific\nAutoclavable Polypropylene Container \u2026 Ideal spill trays for autoclaving waste disposal containers such as the Dynalon Bio-bins Autoclave tray for \u2026 Follow Us \u2026\nSterilizers \u2013 Portable Single Drum Autoclave Manufacturer \u2026 Manufacturer of Sterilizers \u2013 Portable Single Drum Autoclave, Vertical Autoclave Double Drum(S.S) offered by Advanced Technocracy Inc., Ambala, Haryana Pans and Trays \u2013 Containers | Sigma-Aldrich Sigma-Aldrich Online Catalog Product List: Pans and Trays ASME Autoclave \u2013 Manufacturer from Coimbatore Manufacturer of ASME Autoclave \u2013 ASME U Stamp Autoclave, ASME Certified Autoclave and Code Autoclave offered by Autotherm Equipments Corporation, Coimbatore, Tamil Nadu Medical sterilizer \u2013 All medical device manufacturers \u2013 Videos Vertical space-saving autoclave for medical working room * Quick Lock Lid \u2026 TELL US WHAT YOU THINK. \u2026 Contact the manufacturer to get an estimate or \u2026 Automatic Steam Sterilizer Class B Autoclave \u2013 Buy Steam \u2026 Automatic Steam Sterilizer Class B Autoclave , Find Complete Details about Automatic Steam Sterilizer Class B Autoclave,Steam Sterilizer,Sterilizer,Autoclave from Sterilization Equipments Supplier or Manufacturer-Cixi Tonsor Medical Instrument Co., Ltd.\nAutoclave (industrial) \u2013 Wikipedia Such is the quality of autoclave door design that the US experiences as few \u2026 Doing this right depends upon providing the correct data to the autoclave manufacturer.",
        "meta": {
            "lang": "en",
            "lang_score": 0.7060972452163696,
            "url": "http://industrialboiler.cc/autoclave-container-us-manufacturer/",
            "timestamp": "2023-11-28T08:54:59Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.033296337402885685
                ],
                [
                    3,
                    0.013318534961154272
                ],
                [
                    4,
                    0.02413984461709212
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.10793562708102108
                ],
                [
                    6,
                    0.07214206437291898
                ],
                [
                    7,
                    0.05910099889012209
                ],
                [
                    8,
                    0.04800221975582686
                ],
                [
                    9,
                    0.037458379578246395
                ],
                [
                    10,
                    0.037458379578246395
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.5625,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 585,
            "mean_word_length": 6.160683760683761,
            "num_of_sentences": 8,
            "symbol_to_word_ratio": 0.06666666666666667,
            "fraction_of_words_with_alpha_character": 0.8871794871794871,
            "num_of_stop_words": 116,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "This is a very cool thing Reebok is doing:\nBoston Strong Tees from Reebok \u2013 100% of the profits from the sale of the Boston Strong Tees will be donated to The One Fund Boston, Inc. to help the people most affected by the tragic events that occurred in Boston on April 15, 2013.",
        "meta": {
            "lang": "en",
            "lang_score": 0.9618316888809204,
            "url": "http://integrativemom.com/tag/boston-strong-reebok/",
            "timestamp": "2023-11-28T10:26:45Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.10714285714285714
                ],
                [
                    3,
                    0.14285714285714285
                ],
                [
                    4,
                    0.049107142857142856
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 54,
            "mean_word_length": 4.148148148148148,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9259259259259259,
            "num_of_stop_words": 17,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Jenna Nash-McCabe is a mother, wife and mortgage specialist living in Valleyview, Kamloops. She lives with her husband Tyrone and two daughters, Brooklyn and Harper. While Jenna works at Mortgage West, Tyrone is the manager of Utility Services with the Thompson-Nicola Regional District (TNRD). Like so any families in Kamloops, the Nash-McCabe family enjoys playing [\u2026]",
        "meta": {
            "lang": "en",
            "lang_score": 0.9478633999824524,
            "url": "http://jennamortgagebroker.com/category/kamloops/",
            "timestamp": "2023-11-28T10:36:50Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.050793650793650794
                ],
                [
                    3,
                    0.05714285714285714
                ],
                [
                    4,
                    0.06031746031746032
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 1.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 56,
            "mean_word_length": 5.625,
            "num_of_sentences": 4,
            "symbol_to_word_ratio": 0.017857142857142856,
            "fraction_of_words_with_alpha_character": 0.9821428571428571,
            "num_of_stop_words": 13,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Skip to main navigation\nIt's on Beaugeon\nNews media\nCompany news\nIndustry news\nProduct display\nA track spotlights series\nTrack spotlights series\nSeries 65 track spotlights\n6 series track spotlights\n7 series track spotlights\n8 series track spotlights\n8 series projection light without blue edge\nOverhead lighting track spotlights\nM series triangular wall washing lamp\nShowcase lamp series\nBuilt-in mini downlights\nStrip wall wash light\nMini track spotlights\nMini orbit\nMini desktop zoom vertical rod spotlights\nTrack system\nThree wire single loop track\nFour-wire, three-loop track\nDownlight series\nDirect downlights\nSquare downlight\nCorner downlight\nProject case appreciation\nParty history Museum case\nMuseum series\nProject case\nGallery series\nScience Museum Series\nMemorial series\nNature Museum series\nPlanning Library Series\nHotel series\nFactory series\nDownload center\nElite recruitment\nContact us\nShowcase lamp series\n2.5 \"shrapnel mounted mini downlight\n2.5 \"spring mounted mini downlight\n2 inch ceiling mounted mini downlight products\n2 \"thread mounted mini downlight products\n2.5 \"embedded parts with mini downlights",
        "meta": {
            "lang": "en",
            "lang_score": 0.7722927331924438,
            "url": "http://jhegr.young-train.net/products/9",
            "timestamp": "2023-11-28T09:03:00Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.020833333333333332,
            "fraction_of_characters_in_duplicate_lines": 0.018711018711018712,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.12474012474012475
                ],
                [
                    3,
                    0.08731808731808732
                ],
                [
                    4,
                    0.04573804573804574
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.029106029106029108
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.018404907975460124,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 160,
            "mean_word_length": 6.0125,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9375,
            "num_of_stop_words": 8,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "BCCA New Syllabus.\nMerit List for Admission in First Year for the Session 2020-21\nSilver Jubilee Celebration\nExam Fees Notice\nAll Students are hereby informed to fill their Scholarship Forms on Welfare Office Portal before prior period.",
        "meta": {
            "lang": "en",
            "lang_score": 0.8630855083465576,
            "url": "http://jncwadi.ac.in/ViewPhotoGallery.aspx?Data=em",
            "timestamp": "2023-11-28T10:12:06Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.035
                ],
                [
                    3,
                    0.08
                ],
                [
                    4,
                    0.105
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 37,
            "mean_word_length": 5.405405405405405,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.972972972972973,
            "num_of_stop_words": 5,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "The photoshoot team at Ballintaggart house Dingle for a vintage inspired photoshoot in Dingle Co Kerry\nWe would like to hear from you with any feedback about our website or products.",
        "meta": {
            "lang": "en",
            "lang_score": 0.9370946288108826,
            "url": "http://kerryhairdresser.ie/ballintaggart-house-photo-shoot/attachment/054/",
            "timestamp": "2023-11-28T09:56:29Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 2.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.08552631578947369
                ],
                [
                    3,
                    0.1118421052631579
                ],
                [
                    4,
                    0.125
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 31,
            "mean_word_length": 4.903225806451613,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 1.0,
            "num_of_stop_words": 5,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Opera for Mobile Devices - Download\nDownload Opera Mini 8\nDownload in another language.\nOther download options\nFor more information, visit www.opera.com/mobile with your desktop browser",
        "meta": {
            "lang": "en",
            "lang_score": 0.7749639749526978,
            "url": "http://m.opera.com/?region=bg&act=lp&vid=0xbc9454fdb232de4b&tag=mini5&rnd=2499415942&cert=none",
            "timestamp": "2023-11-28T11:22:05Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.05
                ],
                [
                    3,
                    0.0875
                ],
                [
                    4,
                    0.13125
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.037037037037037035,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 26,
            "mean_word_length": 6.153846153846154,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9230769230769231,
            "num_of_stop_words": 4,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Opera for Mobile Devices - Download\nDownload Opera Mini 8\nDownload in another language.\nOther download options\nFor more information, visit www.opera.com/mobile with your desktop browser",
        "meta": {
            "lang": "en",
            "lang_score": 0.7245530486106873,
            "url": "http://m.opera.com/?rnd=3266146002&act=lp&utm_campaign=hp_to_m_opera_com&utm_medium=ip&utm_source=opcom_hp_wap&tag=mini5&vid=0x704c83ea7ccd958b&region=ga&cert=none",
            "timestamp": "2023-11-28T11:01:24Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.05
                ],
                [
                    3,
                    0.0875
                ],
                [
                    4,
                    0.13125
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.037037037037037035,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 26,
            "mean_word_length": 6.153846153846154,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9230769230769231,
            "num_of_stop_words": 4,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Opera for Mobile Devices - Download\nDownload Opera Mini 8\nDownload in another language.\nOther download options\nFor more information, visit www.opera.com/mobile with your desktop browser",
        "meta": {
            "lang": "en",
            "lang_score": 0.678227424621582,
            "url": "http://m.opera.com/?tag=mini5&region=fy&rnd=3278469069&cert=none&vid=0x235b0b592dfc036a&utm_medium=ip&utm_source=opcom_hp_wap&utm_campaign=hp_to_m_opera_com&act=lp",
            "timestamp": "2023-11-28T11:28:42Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.05
                ],
                [
                    3,
                    0.0875
                ],
                [
                    4,
                    0.13125
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.037037037037037035,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 26,
            "mean_word_length": 6.153846153846154,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9230769230769231,
            "num_of_stop_words": 4,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Opera for Mobile Devices - Download\nDownload Opera Mini 8\nDownload in another language.\nOther download options\nFor more information, visit www.opera.com/mobile with your desktop browser",
        "meta": {
            "lang": "en",
            "lang_score": 0.7065049409866333,
            "url": "http://m.opera.com/?utm_source=opcom_hp_wap&vid=0x059551f10c7529fb&act=lp&region=ar&tag=mini5&utm_campaign=hp_to_m_opera_com&rnd=1916998633&utm_medium=ip&cert=none",
            "timestamp": "2023-11-28T11:20:11Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.05
                ],
                [
                    3,
                    0.0875
                ],
                [
                    4,
                    0.13125
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.037037037037037035,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 26,
            "mean_word_length": 6.153846153846154,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9230769230769231,
            "num_of_stop_words": 4,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Opera for Mobile Devices - Download\nDownload Opera Mini 8\n(English (Indonesia))\nDownload in another language.\nOther download options\nFor more information, visit www.opera.com/mobile with your desktop browser",
        "meta": {
            "lang": "en",
            "lang_score": 0.7177231311798096,
            "url": "http://m.opera.com/?utm_source=opcom_hp_wap&vid=0x99d940ce977e4308&act=lp&region=en-id&tag=mini5&utm_campaign=hp_to_m_opera_com&rnd=1715378656&utm_medium=ip&cert=none",
            "timestamp": "2023-11-28T10:32:25Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.044444444444444446
                ],
                [
                    3,
                    0.07777777777777778
                ],
                [
                    4,
                    0.11666666666666667
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 28,
            "mean_word_length": 6.428571428571429,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9285714285714286,
            "num_of_stop_words": 4,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Opera for Mobile Devices - Download\nDownload Opera Mini 8\n(English (Indonesia))\nDownload in another language.\nOther download options\nFor more information, visit www.opera.com/mobile with your desktop browser",
        "meta": {
            "lang": "en",
            "lang_score": 0.7177231311798096,
            "url": "http://m.opera.com/?vid=0xf4e121e4f82b35b7&cert=none&rnd=2182509351&utm_source=opcom_hp_wap&utm_campaign=hp_to_m_opera_com&utm_medium=ip&region=en-id&act=lp&tag=mini5",
            "timestamp": "2023-11-28T11:06:24Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.044444444444444446
                ],
                [
                    3,
                    0.07777777777777778
                ],
                [
                    4,
                    0.11666666666666667
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 28,
            "mean_word_length": 6.428571428571429,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9285714285714286,
            "num_of_stop_words": 4,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "A facial treatment is an intensive cleansing method done by an experienced licensed esthetician who gently exfoliates, moisturizes, and cleans\u2026\nThere are several villas in Goa that are affordable and provide you with all the luxuries. You may choose a\u2026\nBlue Peter introduces its presenters like jumping from a plane doing something daring and dramatic. However, from home because of\u2026",
        "meta": {
            "lang": "en",
            "lang_score": 0.9667429327964783,
            "url": "http://madinkpress.com/category/entertainment/",
            "timestamp": "2023-11-28T08:59:23Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.021604938271604937
                ],
                [
                    3,
                    0.04938271604938271
                ],
                [
                    4,
                    0.05555555555555555
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 1.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 60,
            "mean_word_length": 5.4,
            "num_of_sentences": 3,
            "symbol_to_word_ratio": 0.05,
            "fraction_of_words_with_alpha_character": 1.0,
            "num_of_stop_words": 10,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Top 130+ Css floating animation\nCss floating animation Lovely funny images bring many useful information experiences for all users.\n1 Css floating animation Youtube\nFloating Text Animation Effects | Html CSS Animation \u2013 YouTube\nWith Css floating animation , Every detail in the image is created with passion and care to bring out the best experience for the view\nHere is a collection of beautiful pictures by Dwaipayan Mazumdar, You can see a series of pictures and other topics in the beautiful pictures category Animal of merkantilaklubben.org compilation and compilation.",
        "meta": {
            "lang": "en",
            "lang_score": 0.7939780950546265,
            "url": "http://merkantilaklubben.org/top-130-css-floating-animation/",
            "timestamp": "2023-11-28T09:40:09Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.09072164948453608
                ],
                [
                    3,
                    0.16494845360824742
                ],
                [
                    4,
                    0.03711340206185567
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 90,
            "mean_word_length": 5.388888888888889,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9444444444444444,
            "num_of_stop_words": 22,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "What is Community Property? Washington is a Community property state. Upon dissolution, the Court must distribute all the property owned by the parties between them (both community and separate). The Court first determines whether the property is characterized as community property or separate property. Separate property is that which one spouse owned before the marriage [\u2026]\nCommunity Property Agreement\nEstate Planning: Community Property Agreement Washington is a community property state, which means that all property in the state of Washington is either community property or separate property. Separate property is that which is owned before the marriage or received as a gift or inheritance during the marriage. All other property acquired during marriage as [\u2026]\nCost of Wills Affordable\nEstate Planning: Cost of Wills What is the cost of Wills? We do a variety of Washington wills and other estate planning documents for our clients at an affordable fixed price and cost. For your convenience, some examples of the cost of wills and other estate planning documents are as follows: Simple Will (single person) [\u2026]\nDeath and Eternity\nDeath and Eternity A client recently came into the office to have a Will, Durable Power of Attorney and Health Care Directive prepared. He just found out he had cancer, and was given only about a month to live. To say the least, he was in a state of shock. As a lawyer, we are [\u2026]\nDurable Power of Attorney\nEstate Planning: Durable Power of Attorney In thinking through your estate planning, a document you should consider is a Durable Power of Attorney (POA). This is a document that gives someone else the power to legally sign documents and make decisions on your behalf. Without adequate safeguards, this can be a dangerous document because that [\u2026]\nPower of Attorney for Children\nDo you have a Power of Attorney for your adult children? Do you realize the possible need for one and the potential consequence of not having one? A Power of Attorney is a document that allows another person to make decisions and sign documents on your behalf. These are important documents in estate planning. Typically [\u2026]\nPrenuptial Agreement\nFamily Law: Prenuptial Agreement A Prenuptial Agreement is a contract entered into by two people before their marriage. They redefine the laws of the State of Washington and how it applies to their specific marriage. They often decide how property will be divided if they get a divorce, legal separation, annulment, of when one of [\u2026]\nRevocable Living Trust\nEstate Planning Tools: Revocable Living Trust A Revocable Living Trust has become popular estate planning tool to pass property to heirs after you die and to avoid probate. Like a will, the trust is revocable so you can modify or eliminate it at any time. The written trust agreement appoints a trustee to administer your [\u2026]\nTrust Wills for Minor Children\nIf you have minor children, they cannot inherit your estate directly when you die. If they were to inherit while minors, a Court supervised Guardianship would have to be set up to manage the estate. The Court would then decide who the guardian is, and control when, if and how the estate is used for [\u2026]\nWashington Codicil\nEstate Planning: Washington Codicil In Washington, a codicil is simply an amendment to a will. If you need to make changes to your will, you can either redo the entire will, or if it is only a minor change, you can do it by codicil. With a codicil you usually revoke a paragraph and replace [\u2026]",
        "meta": {
            "lang": "en",
            "lang_score": 0.9506161212921143,
            "url": "http://mgrlaw.com/practice-areas/wills/",
            "timestamp": "2023-11-28T09:21:55Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.016803840877914953
                ],
                [
                    3,
                    0.0360082304526749
                ],
                [
                    4,
                    0.03017832647462277
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.044238683127572016
                ],
                [
                    6,
                    0.033950617283950615
                ],
                [
                    7,
                    0.021604938271604937
                ],
                [
                    8,
                    0.021604938271604937
                ],
                [
                    9,
                    0.021604938271604937
                ],
                [
                    10,
                    0.021604938271604937
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.5263157894736842,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 591,
            "mean_word_length": 4.934010152284264,
            "num_of_sentences": 26,
            "symbol_to_word_ratio": 0.01692047377326565,
            "fraction_of_words_with_alpha_character": 0.9830795262267343,
            "num_of_stop_words": 138,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Munchies and Munchkins\nFood and travel\nOctober 5, 2015 \u00b7 by munchiesandmunchkins \u00b7 Leave a Comment\nComment *\nName *\nEmail *\nNotify me of new posts by email.\nThis site uses Akismet to reduce spam. Learn how your comment data is processed.",
        "meta": {
            "lang": "en",
            "lang_score": 0.8647617101669312,
            "url": "http://munchiesandmunchkins.com/chai-latte-ice-cream/image-1116/",
            "timestamp": "2023-11-28T10:55:10Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.05641025641025641
                ],
                [
                    3,
                    0.10256410256410256
                ],
                [
                    4,
                    0.12307692307692308
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.044444444444444446,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 43,
            "mean_word_length": 4.534883720930233,
            "num_of_sentences": 3,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.8372093023255814,
            "num_of_stop_words": 6,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Recent Posts\nRecent Comments\n- kmkat on Knitting adventures with Lucy\n- mary lou on New inspirations: the Staffordshire Hoard\n- Indie Design Giftalong \u2013 part 4 of 4 | Natalie Servant Designs on Indie Design Giftalong \u2013 part 3 of 4\n- Indie Design Giftalong \u2013 part 3 of 4 | Natalie Servant Designs on Indie Design Giftalong \u2013 part 2 of 4\n- Indie Design Giftalong \u2013 part 2 of 4 | Natalie Servant Designs on Indie Designer Giftalong \u2013 part 1 of 4!\n- March 2021\n- July 2018\n- June 2018\n- April 2018\n- March 2018\n- January 2018\n- November 2017\n- October 2017\n- September 2017\n- August 2017\n- July 2017\n- June 2017\n- May 2017\n- April 2017\n- March 2017\n- February 2017\n- January 2017\n- November 2016\n- October 2016\n- August 2016\n- July 2016\n- June 2016\n- May 2016\n- April 2016\n- March 2016\n- February 2016\n- January 2016\n- December 2015\n- November 2015\n- October 2015\n- September 2015\n- August 2015\n- July 2015\n- June 2015\n- May 2015\n- April 2015\n- March 2015\n- February 2015\n- January 2015\n- December 2014\n- November 2014\n- October 2014\n- September 2014\n- August 2014\n- July 2014\n- June 2014\n- May 2014\n- April 2014\n- March 2014\n- February 2014\n- January 2014\n- December 2013\n- November 2013\n- October 2013\n- September 2013\n- August 2013\n- July 2013\n- June 2013\n- May 2013\n- April 2013\n- March 2013\n- February 2013\n- January 2013\n- December 2012\n- November 2012\n- October 2012\n- September 2012\n- August 2012\n- July 2012\n- June 2012\n- May 2012\n- April 2012\n- March 2012\n- February 2012\n- January 2012\n- December 2011\n- November 2011\n- October 2011\n- September 2011\n- August 2011\n- July 2011\n- June 2011\n- May 2011\n- April 2011\n- March 2011\n- February 2011\n- January 2011\n- December 2010\n- November 2010\n- October 2010\n- September 2010\n- August 2010\n- July 2010\n- June 2010\n- April 2010\n- March 2010\n- February 2010\n- January 2010\n- December 2009\n- November 2009\n- October 2009\n- September 2009\n- August 2009\n- July 2009\n- June 2009\n- May 2009\n- April 2009\n- March 2009\n- February 2009\n- January 2009\n- November 2008\n- October 2008\n- September 2008\n- August 2008\n- July 2008\n- May 2008\n- April 2008\n- March 2008\n- January 2008\n- November 2007\n- September 2007\n- August 2007\n- July 2007\n- May 2007\n- April 2007\n- March 2007\n- February 2007\n- January 2007\n- December 2006\n- November 2006\n- October 2006\n- September 2006\n- July 2006\n- June 2006\n- May 2006\n- April 2006\n- March 2006\n- February 2006\n- January 2006\n- February 2004\nTag Archives: e-book\nSunflower Field Shawl/ Summer in Provence e-book ready available!\nThe Sunflower Field Shawl is the second in a series of shawls inspired by fields in France. One of the sights that you see in the Tour de France as the cyclists whip by are fields of sunflowers beaming at \u2026 Continue reading\nPosted in design, knitting Tagged e-book, KAL, Lavender Fields shawl, Summer in Provence, Summer in Provence e-book, Sunflower Field Shawl, Tour de France, Tour de France KAL Comments Off\nSunflower is off the needles!\nIt\u2019s been a busy week here in the land of perpetual house showings. Despite that, I\u2019ve finally managed to cast off my sunflower shawl. It\u2019s not blocked and dry yet, but here\u2019s a little preview of what it looked like \u2026 Continue reading\nPosted in design, inspiration, knitting Tagged contest, e-book, Hasmi, Lavender Fields, Rocky Mountain Dyeworks, Summer in France, Sunflower shawl, sunflowers, Tour de France 9 Comments",
        "meta": {
            "lang": "en",
            "lang_score": 0.9709111452102661,
            "url": "http://natalieservant.ca/tag/e-book/",
            "timestamp": "2023-11-28T11:10:31Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.03106508875739645
                ],
                [
                    3,
                    0.03106508875739645
                ],
                [
                    4,
                    0.03883136094674556
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.07285502958579881
                ],
                [
                    6,
                    0.06360946745562131
                ],
                [
                    7,
                    0.051775147928994084
                ],
                [
                    8,
                    0.051775147928994084
                ],
                [
                    9,
                    0.019230769230769232
                ],
                [
                    10,
                    0.019230769230769232
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0074850299401197605,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.9119496855345912,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 663,
            "mean_word_length": 4.078431372549019,
            "num_of_sentences": 7,
            "symbol_to_word_ratio": 0.0030165912518853697,
            "fraction_of_words_with_alpha_character": 0.5339366515837104,
            "num_of_stop_words": 76,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "|Support for your Ob-serve system\nOb-serve offers a variety of support services to help users make the most of their Ob-serve system.\nPlease choose your product to view the details:\n\u00a9 Ob-serve Business Computing Ltd 2019\nOb-serve Homepage - Retailer Homepage - Pharmacy Homepage - Invoicer Homepage - Rentbook Homepage",
        "meta": {
            "lang": "en",
            "lang_score": 0.8735114336013794,
            "url": "http://ob-serve.co.uk/services/support.htm",
            "timestamp": "2023-11-28T09:13:42Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.13382899628252787
                ],
                [
                    3,
                    0.055762081784386616
                ],
                [
                    4,
                    0.08550185873605948
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.038461538461538464,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 50,
            "mean_word_length": 5.38,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.88,
            "num_of_stop_words": 8,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Crazy Horse Memorial- Black Hills, South DakotaOBRT2018NEW2020-08-17T03:12:46+00:00 Leave a Reply Cancel replyYour email address will not be published. Required fields are marked *Comment * Name * Email * Website Save my name, email, and website in this browser for the next time I comment.",
        "meta": {
            "lang": "en",
            "lang_score": 0.7729713320732117,
            "url": "http://ourbestroadtrips.com/crazy-horse-memorial-black-hills-south-dakota/",
            "timestamp": "2023-11-28T11:09:21Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.04048582995951417
                ],
                [
                    3,
                    0.07692307692307693
                ],
                [
                    4,
                    0.09716599190283401
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 44,
            "mean_word_length": 5.613636363636363,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9318181818181818,
            "num_of_stop_words": 3,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "|UK gay lads | Gay news UK | Gay travel and holidays UK | UK & London gay scene\nOutUK features the latest gay news, advice, entertainment and information together with gay guides to cities and holiday destinations around the UK, Europe and the rest of the world. There are hundreds of galleries of photos and videos of the sexiest gay guys plus intimate personal profiles of thousands of gay lads from all around the UK.",
        "meta": {
            "lang": "en",
            "lang_score": 0.8270889520645142,
            "url": "http://outuk.co.uk/content/features/scary/index.html",
            "timestamp": "2023-11-28T10:39:46Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.04057971014492753
                ],
                [
                    3,
                    0.028985507246376812
                ],
                [
                    4,
                    0.03188405797101449
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.02564102564102564,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 76,
            "mean_word_length": 4.5394736842105265,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9473684210526315,
            "num_of_stop_words": 24,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Aug 31, 2015\nJosh leads the crew through conversations that continually devolve into childish humor, you may laugh at us, but you are sure to laugh. Andrew, Joe and Jonathan are along for the ride discussing the S Pen concerns with the Samsung Galaxy Note 5, talk about their expectations for IFA and tablets, then discuss giving...\nAug 23, 2015\nJonathan Feist, Andrew Grush and Joe Hindy share their thoughts on Samsung\u2019s newest large sized phones. In this grab bag of an episode we also discuss a major Android Wear update, Project Ara, Alphabet and the official name for the next Android release, Android 6.0 Marshmallow. BlackBerry enjoys some airtime for...\nAug 15, 2015\nWith another Samsung launch comes every discussion about the new devices, their merits, and their faults. Unfortunately for the brand new Samsung Galaxy Note 5 and the S6 Edge Plus (happily called the \"S6 Edge Big\" by our podcasters), thoughts on the new smartphones seem lean toward the faults. And in this special...\nAug 10, 2015\nIn a week that falls between a few relly big launches, the AA Podcast team decides to table the Galaxy Note 5 talk in lieu of more pressing, security matters. Joshua Vergara is joined by Nirave Gondhia and Jonathan Feist to talk about the latest scare in the Android world: Stagefright. As a piece of malware that can...\nAug 3, 2015\nFrom a mostly quiet garage in the middle of one of Southern California's hottest summer days, Josh gets together with Jonathan Feist, Andrew Grush, and returning guest Lanh Nguyen to talk about the big launches from the previous week. Unless you were under a rock for the past 7 days, you should know that we're talking...",
        "meta": {
            "lang": "en",
            "lang_score": 0.94048011302948,
            "url": "http://podcasts.androidauthority.com/podcast/2015/08",
            "timestamp": "2023-11-28T08:48:41Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.017429193899782137
                ],
                [
                    3,
                    0.024691358024691357
                ],
                [
                    4,
                    0.020334059549745823
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.5,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 287,
            "mean_word_length": 4.7979094076655056,
            "num_of_sentences": 9,
            "symbol_to_word_ratio": 0.017421602787456445,
            "fraction_of_words_with_alpha_character": 0.9477351916376306,
            "num_of_stop_words": 67,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Tag Archives: gay marriage\nMarriage is an institution between a man and a woman, periodJuly 31, 2012\nJOHN TAMIHERE \u2013 Radio Live / Sunday News July 29 2012 This week a number of Private Members Bills were drawn from the ballot to make their way to a Private Members day which happens...\nAnglican debate on marriage risks splitting churchJuly 1, 2012\nNZ Herald 30 June 2012 Proposals being considered by the Anglican Church could see gay marriage services carried out in churches by gay priests. Bishops and priests are to vote on proposals covering the blessing...\nLatest poll on same sex marriageJune 16, 2012\nJune 2o12 Yahoo News...\nI\u2019m gay. I oppose gay marriage. Am I a bigot?June 14, 2012\nMail Online 12 June 2012 Despite the opposition of every major faith group \u2014 notably the Catholic Church \u2014 Mr Cameron is arrogantly pressing ahead with an issue which excites his chums in the metropolitan...\nWhy I\u2019m Optimistic About MarriageJune 13, 2012\nOrthodoxy.com 3 March 2011 Building off of Trevin Wax\u2019s excellent post stating the reasons he\u2019s optimistic about being pro-life, I want to follow in like manner and offer the top ten reasons I\u2019m optimistic about...\nTeachers could be forced to promote gay marriage in classrooms (UK)June 11, 2012\nTelegraph (UK) 10 June 2012 Teachers could be forced to promote same-sex marriage in classrooms if gay weddings are legalised, one of Britain\u2019s most senior human rights lawyers has warned. Parents will be powerless to...\nConservative leader supports gay marriage referendumJune 11, 2012\nTVNZ 10 June 2012 Conservative Party leader Colin Craig says he will support a referendum to allow same-sex couples to marry if New Zealanders decide they \u201care ready for a change\u201d. Labour MP Louisa Wall...\nMost homosexuals indifferent to UK gay marriageJune 10, 2012\nMail Online 8 June 2012 Homosexuals are indifferent to David Cameron\u2019s campaign for gay marriage, with fewer than four in ten believing that it is a priority for their community. And there is deep scepticism...\n\u2018Gay marriage\u2019 and homosexuality \u2013 Some medical commentsJune 10, 2012\n\u2018Gay marriage\u2019 and homosexuality \u2013 some medical comments Authors of this report: John Shea,MD, FRCP (C), Radiologist; John K. Wilson MD, FRCP (C), Cardiologist; Paul Ranalli MD, FRCP (C), Neurologist; Christina Paulaitis MD, CCFP, Family...\nSame-sex marriage hurts kidsJune 2, 2012\nThe Courier-Mail November 16, 2010 Gays are not second-class citizens but a gay man certainly makes a second-class mother. Two lesbian women may be model citizens, but neither of them can be a dad to...\nProtecting marriage to protect childrenJune 2, 2012\nLos Angeles Times 19 Sep 08 By David Blankenhorn I\u2019m a liberal Democrat. And I do not favor same-sex marriage. Do those positions sound contradictory? To me, they fit together. Many seem to believe that...\nLet us not forget the entire point of what marriage is forJune 2, 2012\nMiranda Devine The Sunday Telegraph (Aust) Intolerance has marked the entire campaign for gay marriage. The debate has been conducted with such intimidatory venom that anyone who speaks against gay marriage is crucified as an...\nBeyond Gay MarriageJune 2, 2012\nStanley Kurtz \u2013 The Weekly Standard August 2003 Among the likeliest effects of gay marriage is to take us down a slippery slope to legalized polygamy and \u201cpolyamory\u201d (group marriage). Marriage will be transformed into...\nMuslims and Sikhs attack Cameron\u2019s gay marriage planMarch 11, 2012\nTelegraph (UK) 19 March 2012 David Cameron\u2019s plan to legalise gay marriage is \u201cunnecessary and unhelpful\u201d, the country\u2019s largest Muslim organisation has said. The leader of Britain\u2019s Sikh community also attacked the proposal to extend...\nFocus of Adoption Is Best Interests of Child \u2013 Not AdultsJuly 30, 2011\nFamily First Media Release 30 July 2011 Family First NZ is rejecting a call from Labour to \u2018modernise\u2019 adoption laws. \u201cThe purpose of adoption is not to provide a child to adults, but rather to...\nSame-Sex Marriage Research DisputedJuly 19, 2011\nFamily First Media Release 19 July 2011 Family First NZ is disputing a Research NZ poll on same-sex marriage saying that similar polling in March suggests the exact opposite. \u201cThe Research NZ poll of just...",
        "meta": {
            "lang": "en",
            "lang_score": 0.93302983045578,
            "url": "http://protectmarriage.org.nz/archives/tag/gay-marriage",
            "timestamp": "2023-11-28T11:08:48Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 2.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.02498580352072686
                ],
                [
                    3,
                    0.017035775127768313
                ],
                [
                    4,
                    0.01192504258943782
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.03435547984099943
                ],
                [
                    6,
                    0.02668938103350369
                ],
                [
                    7,
                    0.011641113003975015
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.022889842632331903,
            "fraction_of_lines_ending_with_ellipsis": 0.32653061224489793,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 1,
            "num_of_toxic_words": 1,
            "word_count": 683,
            "mean_word_length": 5.156661786237189,
            "num_of_sentences": 17,
            "symbol_to_word_ratio": 0.02342606149341142,
            "fraction_of_words_with_alpha_character": 0.9048316251830161,
            "num_of_stop_words": 113,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "7 Tips for Baby-Friendly Holiday Decor from Candace Plotz Design\nI had the opportunity to chat with my interior design colleague, Candace Plotz, this week about how to decorate my studio for the upcoming holidays. With everything having to be super baby-friendly and toddler-proof, there were quite a few things that we could not do...",
        "meta": {
            "lang": "en",
            "lang_score": 0.9752161502838135,
            "url": "http://purenaturalportraits.com/2017/11/",
            "timestamp": "2023-11-28T08:44:57Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.017793594306049824
                ],
                [
                    3,
                    0.028469750889679714
                ],
                [
                    4,
                    0.07473309608540925
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.5,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 55,
            "mean_word_length": 5.109090909090909,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.01818181818181818,
            "fraction_of_words_with_alpha_character": 0.9818181818181818,
            "num_of_stop_words": 14,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Was: $39.98 Now: $33.98 you save 15%\nGot a problem? Here's your solution! It's Bob...\nPrice: $31.95\nPlease note, this product is TEMPORARILY OUT OF STOCK.",
        "meta": {
            "lang": "en",
            "lang_score": 0.8291374444961548,
            "url": "http://radiospirits.com/P2Browse.asp?sid=NTg3MTk2NDM6Mi8xNi8yMDE5IDEwOjAwOjA5IFBN&Svr=.62&l=1&source=,,&scode=T01CY100&TotalRecordCount=79&CurrentPage=41&genre=&type=4&txtsearch=&seltype=4&selSort=0",
            "timestamp": "2023-11-28T10:30:57Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.07751937984496124
                ],
                [
                    3,
                    0.10852713178294573
                ],
                [
                    4,
                    0.15503875968992248
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.037037037037037035,
            "fraction_of_lines_ending_with_ellipsis": 0.2,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 26,
            "mean_word_length": 4.961538461538462,
            "num_of_sentences": 3,
            "symbol_to_word_ratio": 0.038461538461538464,
            "fraction_of_words_with_alpha_character": 0.8461538461538461,
            "num_of_stop_words": 2,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "gold furniture coffee table manufacturer\nInterior Designing | Bespoke Luxury Furniture | High End Furniture Manufacturing\nRose Gold Champagne gold Silver PVD Color Mirror 8K Finish Decorative T U L Shape 304 201 430 Stainless Steel tile trim\nProviding the decorative metal experience in residential and commercial applications",
        "meta": {
            "lang": "en",
            "lang_score": 0.7937301993370056,
            "url": "http://scanloman.com/eProductlistsid28.html",
            "timestamp": "2023-11-28T09:02:04Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.04659498207885305
                ],
                [
                    3,
                    0.06810035842293907
                ],
                [
                    4,
                    0.08602150537634409
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.04,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 48,
            "mean_word_length": 5.8125,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.8958333333333334,
            "num_of_stop_words": 4,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "--> Devnullius's Choices: A list of default programs to keep your PC running well!\nOnly registered members are allowed to access this section.\nPlease login below or register an account with Samker's Computer Forum - SCforum.info.\nForgot your password?\nTerms of Use | Privacy Policy | Advertising",
        "meta": {
            "lang": "en",
            "lang_score": 0.8411024808883667,
            "url": "http://scforum.info/index.php?PHPSESSID=tlh67ggnuihk0ceiru9s9pvfh6&action=profile;u=7041",
            "timestamp": "2023-11-28T10:14:43Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.060240963855421686
                ],
                [
                    3,
                    0.09236947791164658
                ],
                [
                    4,
                    0.0963855421686747
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.2,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 47,
            "mean_word_length": 5.297872340425532,
            "num_of_sentences": 5,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9148936170212766,
            "num_of_stop_words": 7,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "|Class g: Small proteins [56992] (90 folds)\n|Fold g.3: Knottins (small inhibitors, toxins, lectins) [57015] (19 superfamilies)\ndisulfide-bound fold; contains beta-hairpin with two adjacent disulfides\n|Superfamily g.3.13: Bowman-Birk inhibitor, BBI [57247] (1 family)\n|g.3.13.1: Bowman-Birk inhibitor, BBI [57248] (1 protein)\nTimeline for Superfamily g.3.13: Bowman-Birk inhibitor, BBI:",
        "meta": {
            "lang": "en",
            "lang_score": 0.7756179571151733,
            "url": "http://scop.berkeley.edu/sunid=57247&ver=2.01",
            "timestamp": "2023-11-28T10:16:08Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.18584070796460178
                ],
                [
                    3,
                    0.16519174041297935
                ],
                [
                    4,
                    0.061946902654867256
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 47,
            "mean_word_length": 7.212765957446808,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.8297872340425532,
            "num_of_stop_words": 7,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Tinder has made its Passport function freely available. Typically reserved for paying members, it allows users to change their profile location in order to match up with people across the globe. Just click on a city in the world you\u2019re interested in and begin swiping.",
        "meta": {
            "lang": "en",
            "lang_score": 0.9410441517829895,
            "url": "http://scriptedjourneys.com/tag/tinder/",
            "timestamp": "2023-11-28T10:02:43Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.04017857142857143
                ],
                [
                    3,
                    0.05803571428571429
                ],
                [
                    4,
                    0.07142857142857142
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 45,
            "mean_word_length": 4.977777777777778,
            "num_of_sentences": 3,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 1.0,
            "num_of_stop_words": 11,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "If this is your domain name you must renew it immediately before it is deleted and permanently removed from your account. To renew this domain name visit NameBright.com",
        "meta": {
            "lang": "en",
            "lang_score": 0.9620356559753418,
            "url": "http://semaveral.com/index.php?case=archive&act=show&aid=163",
            "timestamp": "2023-11-28T10:24:15Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.14184397163120568
                ],
                [
                    3,
                    0.05673758865248227
                ],
                [
                    4,
                    0.0851063829787234
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 28,
            "mean_word_length": 5.035714285714286,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 1.0,
            "num_of_stop_words": 3,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "If this is your domain name you must renew it immediately before it is deleted and permanently removed from your account. To renew this domain name visit NameBright.com",
        "meta": {
            "lang": "en",
            "lang_score": 0.9620356559753418,
            "url": "http://semaveral.com/index.php?case=archive&act=show&aid=325",
            "timestamp": "2023-11-28T10:06:05Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.14184397163120568
                ],
                [
                    3,
                    0.05673758865248227
                ],
                [
                    4,
                    0.0851063829787234
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 28,
            "mean_word_length": 5.035714285714286,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 1.0,
            "num_of_stop_words": 3,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "FastCo Design \u2013 Self Care crazy comes to Design April 2017 Todd Bracher's ReCharge Cafe: At Milan Design Week, installations boast the ability to \u201crecharge,\u201d \u201cde-stress,\u201d and \u201creflect on the hectic pace of our world.\u201d View Share: Facebook, Twitter",
        "meta": {
            "lang": "en",
            "lang_score": 0.8795323967933655,
            "url": "http://site.toddbracher.com/2017/04/fastco-design-self-care-crazy-comes-to-design/",
            "timestamp": "2023-11-28T10:48:26Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.05741626794258373
                ],
                [
                    3,
                    0.06220095693779904
                ],
                [
                    4,
                    0.08133971291866028
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 39,
            "mean_word_length": 5.358974358974359,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9487179487179487,
            "num_of_stop_words": 7,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Eddy \"Citizen\" Hauser Read about Ed \u2026\nDedicated to citizens, with love, by and for Citizen Ed Hauser\nReal.coop \u2234 P.O. Box 20046 \u2234 Cleveland, OH 44120\nPrivacy Policy and Terms of Use",
        "meta": {
            "lang": "en",
            "lang_score": 0.8008232116699219,
            "url": "http://smtp.realneo.us/content/cumminsfail2",
            "timestamp": "2023-11-28T10:19:43Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.087248322147651
                ],
                [
                    3,
                    0.12751677852348994
                ],
                [
                    4,
                    0.15436241610738255
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.25,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 33,
            "mean_word_length": 4.515151515151516,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.030303030303030304,
            "fraction_of_words_with_alpha_character": 0.8484848484848485,
            "num_of_stop_words": 6,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "There are many web sites featuring current and archive photographs of Sussex Mills, as well as paintings and drawings.\nThe first table features individual mills whilst the second table features photographic collections.\nPlease contact us to recommend links for inclusion below",
        "meta": {
            "lang": "en",
            "lang_score": 0.9540775418281555,
            "url": "http://sussexmillsgroup.org.uk/links3.htm",
            "timestamp": "2023-11-28T11:21:31Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.11016949152542373
                ],
                [
                    3,
                    0.05084745762711865
                ],
                [
                    4,
                    0.0635593220338983
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 41,
            "mean_word_length": 5.7560975609756095,
            "num_of_sentences": 3,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 1.0,
            "num_of_stop_words": 10,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Abuse (still I stayed\u2026) November 1, 2022 Visiting Blogger 1 comment \u2018\u2019If my girlfriend had cheated on me, I felt that it was a given that I would beat her up, and she\u2019d allow\u2026\u201d Have a read...",
        "meta": {
            "lang": "en",
            "lang_score": 0.9897038340568542,
            "url": "http://tboa.upphelele.co.za/tag/manipulation/",
            "timestamp": "2023-11-28T08:54:19Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.07096774193548387
                ],
                [
                    3,
                    0.07741935483870968
                ],
                [
                    4,
                    0.12903225806451613
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 1.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 37,
            "mean_word_length": 4.1891891891891895,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.08108108108108109,
            "fraction_of_words_with_alpha_character": 0.918918918918919,
            "num_of_stop_words": 6,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "For any kind of issue, You can send your prayer request to the Primate (TCLPFW).Prayer Request\nThe Mobile Phone Lines are for: Prayer Requests Counseling Testimony sharing\nDesign by The Church of Lord World-Wide",
        "meta": {
            "lang": "en",
            "lang_score": 0.8335868716239929,
            "url": "http://tclpfw.org/livestreaming.php",
            "timestamp": "2023-11-28T08:46:58Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.033707865168539325
                ],
                [
                    3,
                    0.056179775280898875
                ],
                [
                    4,
                    0.06741573033707865
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 34,
            "mean_word_length": 5.235294117647059,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 1.0,
            "num_of_stop_words": 6,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Seeker Posted July 1, 2017 Report Share Posted July 1, 2017 I quite liked the term \"differently abled\", but since I'm mundanely abled, I don't think it's any of my business to choose. Again. it's almost certainly well meant, but renaming a group of people to \"protect\" them seems awfully patronizing to me. Quote Link to comment Share on other sites More sharing options...",
        "meta": {
            "lang": "en",
            "lang_score": 0.987881064414978,
            "url": "http://ulc.net/forum/topic/163715-political-correctness-and-communication/page/3/",
            "timestamp": "2023-11-28T09:27:23Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.06451612903225806
                ],
                [
                    3,
                    0.07741935483870968
                ],
                [
                    4,
                    0.1032258064516129
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 1.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 64,
            "mean_word_length": 4.84375,
            "num_of_sentences": 4,
            "symbol_to_word_ratio": 0.015625,
            "fraction_of_words_with_alpha_character": 0.9375,
            "num_of_stop_words": 9,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "1 \u2014 1 of 1 Results\nFirst Friday : The Unauthorized News : Bougainville Independence Struggle (June...\nTopics discussed: Office of Hawaiian Affairs accountability, Pacific Rim Japan America Resort and Golf Executive Conference, alternative press in...\n- Duration:\n- 01:01:03",
        "meta": {
            "lang": "en",
            "lang_score": 0.7526338696479797,
            "url": "http://uluulu.hawaii.edu/titles?role=1&subject=366&template_type=block",
            "timestamp": "2023-11-28T09:32:05Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.008547008547008548
                ],
                [
                    3,
                    0.01282051282051282
                ],
                [
                    4,
                    0.021367521367521368
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.4,
            "fraction_of_lines_starting_with_bullet_point": 0.4,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 40,
            "mean_word_length": 5.85,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.05,
            "fraction_of_words_with_alpha_character": 0.775,
            "num_of_stop_words": 6,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Call Us at (417) 773-6290\nTimber Tom November 21, 2016 Leave a Comment\nPost and Beams with custom milling\nYou must be logged in to post a comment.",
        "meta": {
            "lang": "en",
            "lang_score": 0.8411333560943604,
            "url": "http://walstontimberframe.com/img_8415/",
            "timestamp": "2023-11-28T09:29:37Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.05042016806722689
                ],
                [
                    3,
                    0.06722689075630252
                ],
                [
                    4,
                    0.1092436974789916
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 28,
            "mean_word_length": 4.25,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.8571428571428571,
            "num_of_stop_words": 9,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Governors sef done join oh! See Gov Obiano and Deputy Gov Madumere doing the Ebola-shake I done laugh die. How unna check am?\n\u2014 Dem say dis salt water baff na only hypatenshon he go cause oh. My people, wishones we go do now for this Ebola? How you dey plan to do to prevent am, please share\u2026\nSo na so I hear say programmed ballot paper, programmed thumbprints and programmed vanishing ink sef, na him dey the papers wey dey flow left and right for Osun oh. Wishones my people?",
        "meta": {
            "lang": "en",
            "lang_score": 0.7751175165176392,
            "url": "http://wishones.com/author/adminadmentation-com/page/2/",
            "timestamp": "2023-11-28T08:35:56Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.031007751937984496
                ],
                [
                    3,
                    0.041343669250646
                ],
                [
                    4,
                    0.05167958656330749
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.3333333333333333,
            "fraction_of_lines_starting_with_bullet_point": 0.3333333333333333,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 91,
            "mean_word_length": 4.252747252747253,
            "num_of_sentences": 7,
            "symbol_to_word_ratio": 0.01098901098901099,
            "fraction_of_words_with_alpha_character": 0.989010989010989,
            "num_of_stop_words": 7,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "The movement from public ownership to private ownership of a company's shares either by the company's repurchase of shares or through purchases by an outside private investor.",
        "meta": {
            "lang": "en",
            "lang_score": 0.9769983887672424,
            "url": "http://ww.vcexperts.com/reference/definitions/going-private",
            "timestamp": "2023-11-28T09:42:38Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 2.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.0738255033557047
                ],
                [
                    3,
                    0.10067114093959731
                ],
                [
                    4,
                    0.14093959731543623
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 27,
            "mean_word_length": 5.518518518518518,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 1.0,
            "num_of_stop_words": 7,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "03/29/2016 | Telewave Co-Founder, President Raymond L. Collins, ex-K7EQB/W6GLN, SK\nRaymond L. Collins, ex- K7EQB/W6GLN, the president and co-founder of Telewave Inc, died on March 15.\nLearn More\n09/29/2015 | Radio Amateurs Are Among Radio Club of America 2015 Award Winners\nThe Radio Club of America (RCA) has announced the recipients of its 2015 awards, and the list includes several radio amateurs.\nLearn More",
        "meta": {
            "lang": "en",
            "lang_score": 0.9497033357620239,
            "url": "http://www.arrl.org/news/search/Tag.name:Raymond%20L.%20Collins",
            "timestamp": "2023-11-28T10:20:45Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.16666666666666666,
            "fraction_of_characters_in_duplicate_lines": 0.02586206896551724,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.05172413793103448
                ],
                [
                    3,
                    0.09770114942528736
                ],
                [
                    4,
                    0.10344827586206896
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.030303030303030304,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 64,
            "mean_word_length": 5.4375,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.890625,
            "num_of_stop_words": 10,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "February 2014\nJanuary 2014\nDecember 2013\nNovember 2013\nOctober 2013\nSeptember 2013\nAugust 2013\nJuly 2013\nJune 2013\nMay 2013\nApril 2013\nMarch 2013\nAlberto Bonikowsky\nDavid Bonikowsky\nI\u00f1aki Moreno\nIsrael Piqueras\nJuan Alvarez\nPredicador Visitante\nSubscribir en RSS",
        "meta": {
            "lang": "en",
            "lang_score": 0.8851410150527954,
            "url": "http://www.bautistas-irun.org/mensajes-old1/la-nueva-vida-israel-piqueras",
            "timestamp": "2023-11-28T10:19:27Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 2.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.05357142857142857
                ],
                [
                    3,
                    0.08482142857142858
                ],
                [
                    4,
                    0.10267857142857142
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.04878048780487805,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 39,
            "mean_word_length": 5.743589743589744,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.6923076923076923,
            "num_of_stop_words": 5,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Hi! Simply click below and type your query.\nOur experts will reply you very soon.\nRamghat Road, Aligarh, Uttar Pradesh\nThank you\nYour Enquiry has been sent successfully.\nHome \u203a Sitemap\nLooking for Product Name ?",
        "meta": {
            "lang": "en",
            "lang_score": 0.9146022200584412,
            "url": "http://www.bhavyapharmacy.co.in/sitemap.htm",
            "timestamp": "2023-11-28T10:29:30Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.05113636363636364
                ],
                [
                    3,
                    0.07954545454545454
                ],
                [
                    4,
                    0.10795454545454546
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 36,
            "mean_word_length": 4.888888888888889,
            "num_of_sentences": 5,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9444444444444444,
            "num_of_stop_words": 3,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "| Calendar\n| Mail Lists\n| List Archives\n| Desktop SIG\n| Hardware Hacking SIG\nWiki | Flickr | PicasaWeb | Video | Maps & Directions | Installfests | Keysignings\nLinux Cafe | Meeting Notes | Blog | Linux Links | Bling | About BLU\nHow can I issue Hayes modem commands from a Linux shell? Do I need to start Kermit and issue them from within that environment? Thanks, Chuck Noyes * Mailed from MS Exchange..... ----------------------------------- cnoyes at groucho.webo.dg.com -----------------------------------\n|BLU is a member of BostonUserGroups\n|We also thank MIT for the use of their facilities.",
        "meta": {
            "lang": "en",
            "lang_score": 0.7979887127876282,
            "url": "http://www.blu.org/mhonarc/discuss/1996/12/msg00003.php",
            "timestamp": "2023-11-28T09:04:40Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.018
                ],
                [
                    3,
                    0.02
                ],
                [
                    4,
                    0.028
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.010101010101010102,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 98,
            "mean_word_length": 5.1020408163265305,
            "num_of_sentences": 3,
            "symbol_to_word_ratio": 0.01020408163265306,
            "fraction_of_words_with_alpha_character": 0.7959183673469388,
            "num_of_stop_words": 13,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Monday, March 14, 2016\nNew Spring TreasuresIn: celestina marie design on etsy. Rose Garden Market., decorative painting, new shop treasures 5:00:00 AM By: Celestina Marie\nyou may also like\n49 comments:\nJust beautiful! Spring sure is in the air! And by the way I really want to eat those faux chocolate bunnies! They look so real!!\n- March 14, 2016 at 5:55 AM\n- Nancy Chan said...\nVery lovely and pretty blue and pink creations. Have a beautiful day!\n- March 14, 2016 at 5:58 AM\n- Anna said...\nLovely colors for sweet and beautiful Easter's decorations !!!!\nIt's a pity that the bunnies are in faux chocolate I prefer the true ones ;)\nHug !\n- March 14, 2016 at 6:10 AM\n- Kim said...\nFaux chocolate bunnies!?! How do you make those? How fun!\n- March 14, 2016 at 6:59 AM\n- Liz@ HomeandGardeningWithLiz said...\nThis is the 2nd blog with faux chocolate bunnies I've looked at this morning- not fair!! LOL\u2026.. They look good enough to eat! Love all the pinks!\n- March 14, 2016 at 7:23 AM\n- Gayle said...\nWonderful creations. The bunnies look so real.\n- March 14, 2016 at 7:31 AM\n- FlowerLady Lorraine said...\nYou have been so busy. I love the roses and bluebird tray, very pretty.\nHappy Creating and selling, and Happy Spring ~ FlowerLady\n- March 14, 2016 at 7:31 AM\n- Sue Kosec said...\nIsn't Springtime the best????????? It's when everything comes to life and showers us with beauty.\nHappy Spring ...\n- March 14, 2016 at 7:48 AM\n- Unknown said...\nCelestina Marie, You make the Easter celebration even more special with you beautiful work. Thanks for sharing, Happy Spring!\n- March 14, 2016 at 7:56 AM\n- craftyles said...\nSuch springy and fresh creations. Love the chocolate bunnies. Oh yes and the bluebonnets too. Have a wonderful week!\n- March 14, 2016 at 8:01 AM\n- Jemma@athomewithjemma said...\nGood Morning Pretty Lady,\nWell, these are some precious treasures and faux chocolate bunnies!\nNow who would have thought:)\nDelightful Spring joy with you this morning!\n- March 14, 2016 at 8:43 AM\n- Sandi@ Rose Chintz Cottage said...\nOh, Celestina, your creations are so sweet. I love the soft colours! Pink and aqua are always my favourites. Those faux bunnies are too cute and they look so real. As always your images are a delight to look at. Wishing you a lovely day filled with love and joy.\n- March 14, 2016 at 8:59 AM\n- Tete said...\nFaux chocolate bunnies? Going to have to google how to do those! If I lived closer to you, DH would have to take on a second job to pay for my shopping days with you. LOL\n- March 14, 2016 at 9:04 AM\nHi Celeste! Oh, such pretties you've created! Your painting is just so beautiful. The chocolate bunnies are so cute. Do you spray paint them? They really look like chocolate! :) Now I'm craving a candy bar! ;)\nBe a sweetie,\nShelia ;)\n- March 14, 2016 at 9:09 AM\n- eileeninmd said...\nHello, Celestina! You have some lovely spring creations. The baskets are adorable. I love the bunnies and the eggs. Lovely Easter decorations! Happy Monday, enjoy your new week!\n- March 14, 2016 at 9:12 AM\n- Roosterhead Designs said...\nYours must be the most beautiful Etsy shop ever!!\n(and I almost bit off those chocolate bunny ears! : ) LOL\nThanks for the inspiration and delightful peek in today Celeste~ Karen O\n- March 14, 2016 at 10:04 AM\n- Linda M. said...\nCeleste, All your spring treasures are beautiful. Joyous Wishes, Linda\n- March 14, 2016 at 10:14 AM\n- Denise said...\nsuch lovely things.\n- March 14, 2016 at 11:13 AM\n- Valerie-Jael said...\nHow beautiful you have made everything, your treasures are always so lovely to look at. Hugs, Valerie\n- March 14, 2016 at 11:18 AM\n- Dreaming of Vintage said...\nYour artwork is beautiful Celestina! It reminds me that spring is on the air!\n- March 14, 2016 at 11:19 AM\n- Rose L said...\nLove the tray with its roses and bluebird.\n- March 14, 2016 at 11:32 AM\n- kitty@ Kitty's Kozy Kitchen said...\nOoh such pretty things, sweet friend! You are so talented and I'm proud to know you! xo\n- March 14, 2016 at 11:42 AM\n- Debby Ray said...\nYou are quite the talented lady! Your painted creations are just gorgeous, Celeste! Happy Spring, even though it's not quite official yet :)\n- March 14, 2016 at 12:35 PM\n- Butterfly 8)(8 Bungalow said...\nCelestina, Everything is so pretty and feminine. I like the edge on the pink blanket and your chocolate buddies look like they could be eaten by mistake! Have a wonderful week. xoox Su\n- March 14, 2016 at 12:38 PM\n- The Polka Dot Closet said...\nOh Celeste...You are on fire! These are all gorgeous creations, the blue bird tray is gorgeous...Of course so is everything else! How fun if one year you would sell at the Polka Dot Flea...Oh my gosh it would be so fun! Thank you for your input and continued support on the Flea\n- March 14, 2016 at 1:25 PM\n- ~Lavender Dreamer~ said...\nI love that little trinket box and my favorite thing that you paint are the trays. That would be something I would put on my wish list! Happy Spring! Hugs, diane\n- March 14, 2016 at 1:47 PM\n- Daniela said...\nHow many wonderful, artistic masterpieces, my darling, precious friend, I'm so amazed by your talent, blessed be !\nThank you for sharing these stunning works of yours with us, they fill my heart with such a joy !\nHope your week is off to a great start, I wish you wonderful days to come, sending love to you\n- March 14, 2016 at 2:03 PM\n- Jill said...\nAll are just beautiful and I love the chocolate bunnies they turned out so cute!! All perfect for spring :-)\n- March 14, 2016 at 2:05 PM\n- AnnMarie aka Vintage Junkie aka NaNa said...\nAll are so pretty and bring the feeling of Spring on! Now our weather has to follow suit!\n- March 14, 2016 at 2:19 PM\n- Createology said...\nSo very \"Pretty in Pink\". Your beautiful paintngs are so delightful and really put Spring in view. I adore everything you create dear. Spring Bliss...\n- March 14, 2016 at 3:10 PM\n- Row homes and Cobblestones said...\nWow Celeste you sure have been very busy creating. I love the delicate Pink throw with your feminine signature edge techinque and OMGosh the faux chocolate bunnies make me smile. Happy creating!\n- March 14, 2016 at 7:09 PM\n- living from glory to glory said...\nHello, Yes we all seem to love pink! All your artwork is so lovely! And those Bluebonnets are so beautiful! And yes you have been busy! But I know you truly love what you do!\nEnjoy each and every day!\nHugs and Blessings, Roxy\nAlso, Happy Spring...\n- March 14, 2016 at 7:54 PM\n- Karen@Southern Gal Meets Midwest said...\nI love \"Keep it Pink\" thanks for sharing all your new and beautiful creations with us. They are a feast for the eyes :)\n- March 14, 2016 at 8:12 PM\n- Jan Hermann said...\nCeleste, you are so amazing and such a wonderful painter...I love these new items!\nJan \u2665\n- March 14, 2016 at 8:34 PM\n- Gypsy Heart said...\nI know I repeat myself over & over and I apologize, however, your talent is so amazing I can't help it! So many lovely items it's a bit difficult to say what my favorite would be. Did you make the gorgeous pink throw? It is stunning!\nThank you for sharing all the beauty with us! I'm so grateful that you're feeling better. The past couple of days have been superb with all the sunshine, right? :)\nI hope your week is filled with joy and happiness!\n- March 14, 2016 at 9:23 PM\n- Kathy said...\nAll so gorgeous and making me look forward to Spring even more!\n- March 14, 2016 at 9:31 PM\n- Betty said...\nWOW, you have been busy. Everything is so pretty and I love those signs.\n- March 14, 2016 at 10:03 PM\n- Blondie's Journal said...\nYou are one creative lady! Everything is so perfect for spring and would make lovely gifts (if we could give the up)! I love your little bluebird tray and the eggs. I'm off to look at your shop!\n- March 14, 2016 at 10:37 PM\n- Cheryl said...\nWhat a very skilled painter you are! Man-oh-man I wish I had that kinda talent. Lucky duck!\n- March 14, 2016 at 11:33 PM\n- Claudia said...\nHi Celeste, you show us wonderful Spring Treasures! I love your paintings, they are georgeous! Also your other so creative works are just beuatiful! You are so talented, my dear friend!\nThank you for sharing wonderful pictures from wonderful art-work!\nSending love and hugs and blessings, for a wonderful and joyful week, my dear friend!\nClaudia xo\n- March 15, 2016 at 12:06 AM\n- Castles Crowns and Cottages said...\nWOW you are productive. I want to do a simple pencil sketch of Paris, but do ya think I even have a moment to do so? NO! How lovely all your colors are and those bunnies....sweet as jelly beans! teehhehe\n- March 15, 2016 at 5:01 AM\n- Conniecrafter said...\nAbsolutely Beautiful creations, you are blessed with very creative talents and do such amazing work in all your projects, Love the painted eggs, I think they are my favorite of all of them :)\n- March 15, 2016 at 9:45 AM\n- Lisa said...\nCelestine you are so talented! I want it all! Those chocolate bunnies are absolutely adorable!\n- March 15, 2016 at 9:49 AM\n- Alessandra said...\nYour painted creations are gorgeous! They are all such beautiful,very romantic. I love the pastel colours and every single detail. They are work of art and you are a great artist. The bunnies are stunning, amazing!\n- March 15, 2016 at 3:58 PM\n- Creations By Cindy said...\nOh my goodness! Everything is so beautiful! I love the aqua and rose eggs. How BEAUTIFUL! You have so many timeless treasures. Hugs and blessings, Cindy\n- March 15, 2016 at 6:23 PM\n- Feral Turtle said...\nYou are so talented Celeste! Love your creations. You definitely tricked me with your adorable bunnies!!!\n- March 16, 2016 at 6:54 AM\n- handmade by amalia said...\nSo much spring prettiness in one post! You are a talented artiest, my friend!\n- March 16, 2016 at 6:57 AM\n- Mary@mydogsmygardenandmary said...\nWOW so many beautiful items that you have made. Love the throw. You are so talented.....\nHave a great week my friend.\n- March 16, 2016 at 4:35 PM\n- cynthia lee designs said...\nI just love all your creations. The chocolate bunnies are adorable.\n- March 17, 2016 at 7:59 PM\nPost a Comment\nThank you for stopping by. Your visits and comments are always welcome and I look forward to visiting you in return. Have a blessed day!\nNote: Only a member of this blog may post a comment.\nCelestina Marie\nWelcome To Rose Garden Market from Celestina Marie Design. It is so nice to meet you. My name is Celestina Marie named after my grandmother and my friends call me Celeste.My creative journey extends over 30 years enjoying the love of painting and redesigning vintage and new treasures. I love to go treasure hunting and the fun of finding great vintage pieces to redesign..\nBlog Archive\n- \u25ba 2017 (24)\n- \u25bc March (10)\n- \u25ba February (13)\n- \u25ba December (18)\n- \u25ba November (15)\n- \u25ba October (16)\n- \u25ba September (14)\n- \u25ba August (8)\n- \u25ba July (13)\n- \u25ba June (13)\n- \u25ba May (15)\n- \u25ba April (13)\n- \u25ba March (15)\n- \u25ba February (13)\n- \u25ba December (15)\n- \u25ba November (11)\n- \u25ba October (11)\n- \u25ba September (11)\n- \u25ba August (9)\n- \u25ba July (7)\n- \u25ba June (13)\n- \u25ba May (12)\n- \u25ba April (12)\n- \u25ba March (9)\n- \u25ba February (9)\n- \u25ba December (20)\n- \u25ba November (7)\n- \u25ba October (8)\n- \u25ba May (13)\n- \u25ba April (12)\n- \u25ba March (11)\n- \u25ba February (9)\n- \u25ba December (17)\n- \u25ba November (14)\n- \u25ba October (11)\n- \u25ba September (8)\n- \u25ba July (7)\n- \u25ba May (8)\n- \u25ba April (9)\n- \u25ba March (10)\n- \u25ba February (9)\n- \u25ba December (16)\n- \u25ba October (9)\n- \u25ba August (13)\n- \u25ba July (10)\n- \u25ba June (12)\n- \u25ba May (9)\n- \u25ba December (14)\n- \u25ba November (10)\n- \u25ba October (11)\n- \u25ba September (8)\n- \u25ba August (9)\n- \u25ba July (12)\n- \u25ba June (10)\n- \u25ba May (7)\n- \u25ba December (8)\n- \u25ba October (22)\n- \u25ba July (7)\n- \u25ba 2008 (48)\n- \u25ba November (7)",
        "meta": {
            "lang": "en",
            "lang_score": 0.9329434037208557,
            "url": "http://www.celestinamariedesign.com/2016/03/new-spring-treasures.html",
            "timestamp": "2023-11-28T08:53:35Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0546218487394958,
            "fraction_of_characters_in_duplicate_lines": 0.01756264724780467,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.012636538873420432
                ],
                [
                    3,
                    0.05140286999357464
                ],
                [
                    4,
                    0.054294281430713215
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.09787963161276504
                ],
                [
                    6,
                    0.026986506746626688
                ],
                [
                    7,
                    0.02066823730991647
                ],
                [
                    8,
                    0.0054615549368173056
                ],
                [
                    9,
                    0.003105590062111801
                ],
                [
                    10,
                    0.003105590062111801
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.049265341400172864,
            "fraction_of_lines_ending_with_ellipsis": 0.14488636363636365,
            "fraction_of_lines_starting_with_bullet_point": 0.4431818181818182,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 2200,
            "mean_word_length": 4.244545454545454,
            "num_of_sentences": 151,
            "symbol_to_word_ratio": 0.02590909090909091,
            "fraction_of_words_with_alpha_character": 0.7954545454545454,
            "num_of_stop_words": 287,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "OwnYourShop.com brings eCommerce to your site...\nHong Kong March 28, 2001 - OwnYourShop.com is a leading eCommerce enabler (ASP) targeting SME around the globe, the company's objective is to help SME to start their own on-line shop with easy management and cost effective solutions.\nOwnYourShop.com brings enterprise level of eCommerce features like coupons and up-selling without the hassle of investment in expensive hardware, software and bandwidth. The shop cost is purely based on the number of products the shop owner wishes to make available on the Web site! The low monthly rates make OwnYourShop.com the perfect eCommerce solution for SME business.\nOwnYourShop.com has also teamed up with Planet Payment (http://www.planetpayment.com), a well known international merchant account service provider based in New York, USA and branches in UK and Singapore. We have created a complete solution to help your business to accept on-line credit card and to sell your products online in 146 currencies and receive funds in one of 22 currencies. Planet Payment has solutions for vendors of all sizes, inside or outside of the United States. Successful eCommerce merchants were around the globe, such as USA, Hong Kong, Tokyo, Singapore, Paris, Australia...\nDoing on-line business couldn't be easier now, own your on-line shop as low as US$19.95 (HK$155.00) per month.",
        "meta": {
            "lang": "en",
            "lang_score": 0.9389031529426575,
            "url": "http://www.chitao.com/the.company/news.asp?news.id=31",
            "timestamp": "2023-11-28T10:39:52Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.03633217993079585
                ],
                [
                    3,
                    0.025951557093425604
                ],
                [
                    4,
                    0.02768166089965398
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.4,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 211,
            "mean_word_length": 5.478672985781991,
            "num_of_sentences": 8,
            "symbol_to_word_ratio": 0.009478672985781991,
            "fraction_of_words_with_alpha_character": 0.976303317535545,
            "num_of_stop_words": 43,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Pleasantly Uneven: A Review of A New Evangelical Manifesto for SpeakEasy Bloggers\nA New Evangelical Manifesto: A Kingdom Vision of the Common Good Edited by David P. Gushee 240 pp. Chalice Press. $24.99. I\u2019ll go ahead and shoot straight here: when I\u2026",
        "meta": {
            "lang": "en",
            "lang_score": 0.7652167677879333,
            "url": "http://www.christianhumanist.org/tag/a-new-evangelical-manifesto/",
            "timestamp": "2023-11-28T08:36:25Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.03827751196172249
                ],
                [
                    3,
                    0.14354066985645933
                ],
                [
                    4,
                    0.11483253588516747
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.5,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 42,
            "mean_word_length": 4.976190476190476,
            "num_of_sentences": 4,
            "symbol_to_word_ratio": 0.023809523809523808,
            "fraction_of_words_with_alpha_character": 0.9523809523809523,
            "num_of_stop_words": 6,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Driven Far Off\nThe latest on the indie, alternative, and rock music scene including news, music, contest, interviews, and more. Best described as your favorite place to find new bands.\nJuly 19, 2007 By Bryce Jacobson Leave a Comment",
        "meta": {
            "lang": "en",
            "lang_score": 0.944537341594696,
            "url": "http://www.drivenfaroff.com/contests/playradioplay/",
            "timestamp": "2023-11-28T10:39:45Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.04639175257731959
                ],
                [
                    3,
                    0.061855670103092786
                ],
                [
                    4,
                    0.07731958762886598
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 39,
            "mean_word_length": 4.9743589743589745,
            "num_of_sentences": 3,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9487179487179487,
            "num_of_stop_words": 9,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "- Fugitive caught 3 days after escape from hospital\n- Mayplace Hotel marks ninth anniversary with room promotions\n- World Cup in Saudi Arabia sparks human rights protest\n- Visa applications open for additional 12,900 foreign workers\n- Hyundai to develop own cheaper batteries for EVs\n- [Test Drive] Upgraded Polestar 2 dons Iron Man mask\n- [Bills in Focus] Broader offshore financial support, mobility regulatory sandbox\n- Central Asia, S. Korea pledge to strengthen youth cooperation\n- Samsung family to sell stakes worth W2.6tr to pay tax\n- S. Korea, Thailand to work to resolve entry denial claims\n- \ud569\uc758\ubb38\ub3c4 \uc5c6\ub294 \ud76c\ud55c\ud55c \ubd81\u00b7\ub7ec \uc815\uc0c1\ud68c\ub2f4\u2026\uacb0\uad6d \ube44\uc988\ub2c8\uc2a4 \uad00\uacc4\uc600\ub098\n- [\uc774\ubc88 \uc8fc \ub9ac\ubdf0]\u7f8e Fed \uae30\uc900\uae08\ub9ac \ub3d9\uacb0\u2026\uc774\uc7ac\uba85 \uccb4\ud3ec\ub3d9\uc758\uc548 \uac00\uacb0(18~23\uc77c)\n- Incheon Airport passenger traffic to recover during Chuseok holiday\n- \ud55c\ub3d9\ud6c8, \uccb4\ud3ec\uc548 \uc124\uba85 8\ubd84 \ub118\uae30\uc790\u2026\u201c\uc9e7\uac8c \ud569\uc2dc\ub2e4\u201d \u201c\uc65c \uc774\ub9ac \uc2dc\ub044\ub7fd\ub0d0\u201d\n- \uc57c\ub2f9 29\uba85 \ubc18\ub780, \uc774\uc7ac\uba85 \ubc29\ud0c4 \ub6ab\ub838\ub2e4\n- FSS issues advisories to fisheries cooperatives federation for W50b investment loss\n- Biden picks top Asia aide as nominee for deputy secretary of state\n- Solo Korean trekker found dead in Himalayas\n- PPP decides to lift membership suspensions of ex\n- English chatbot services to be available for public bike users\n- Arrest warrant sought for ex\n- S. Korea's inflation grows faster, stays over 3 pct for third month in Oct.\n- \u2018It\u2019s OK to put fried chicken, ramen on jesa table\u2019\n- Asiana Airlines board to reconvene to vote on cargo biz sell\n- Israeli military jets strike Gaza, says Hamas commander killed\n- Indonesia\u2019s upcycling startup wins Korea\n- Embracing setbacks: KAIST students vie for the inaugural 'worst failure' crown\n- S. Korean military detects signs of NK supplying ballistic missiles to Russia",
        "meta": {
            "lang": "en",
            "lang_score": 0.815211296081543,
            "url": "http://www.einwandverwandler.com/haxomjh/",
            "timestamp": "2023-11-28T09:10:40Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.006666666666666667
                ],
                [
                    3,
                    0.011111111111111112
                ],
                [
                    4,
                    0.011851851851851851
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.04421768707482993,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.9333333333333333,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 281,
            "mean_word_length": 4.804270462633452,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.010676156583629894,
            "fraction_of_words_with_alpha_character": 0.7829181494661922,
            "num_of_stop_words": 28,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Work Programme\nRead our latest European Schoolnet's work programme and discover our roadmap to transform and offer value the education community? Every year European Schoolnet Steering Committee members confirmed new priorities.\nFind out this and much more in our latest Work Programme.",
        "meta": {
            "lang": "en",
            "lang_score": 0.8759346604347229,
            "url": "http://www.eun.org/work-programme;jsessionid=0445CC466044E593485B7B9936BFC2CD",
            "timestamp": "2023-11-28T10:07:31Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.10612244897959183
                ],
                [
                    3,
                    0.06938775510204082
                ],
                [
                    4,
                    0.08163265306122448
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 42,
            "mean_word_length": 5.833333333333333,
            "num_of_sentences": 3,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 1.0,
            "num_of_stop_words": 7,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Online Encyclopedia\n1 E11 m\nTo help compare distances at different orders of magnitude this page lists lengths starting at 1011 metres (100 million kilometres or 0.7 astronomical units).\n- Distances shorter than 1011 m\n- 108 million km -- 0.7 AU -- Distance between Venus and the Sun\n- 150 million km -- 1.0 AU -- Distance between the Earth and the Sun\n- 228 million km -- 1.5 AU -- Distance between Mars and the Sun\n- 290 million km -- 1.9 AU -- Minimum diameter of Betelgeuse\n- 480 million km -- 3.2 AU -- Maximum diameter of Betelgeuse\n- 591 million km -- 4.0 AU -- Minimum distance between the Earth and Jupiter\n- 624 million km -- 4.2 AU -- Diameter of Antares\n- 780 million km -- 5.2 AU -- Distance between Jupiter and the Sun\n- 965 million km -- 6.4 AU -- Maximum distance between the Earth and Jupiter\n- Distances longer than 1012 m\nSee also: Orders of magnitude, orders of magnitude (length)\nExternal link\nConversion Calculator for Units of LENGTH http://www.ex.ac.uk/cimt/dictunit/ccleng.htm\nLast updated: 02-05-2005 02:32:14\nLast updated: 02-09-2005 15:22:38",
        "meta": {
            "lang": "en",
            "lang_score": 0.6916611790657043,
            "url": "http://www.fact-archive.com/encyclopedia/1_E11_m%B2",
            "timestamp": "2023-11-28T09:01:18Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.09194097616345062
                ],
                [
                    3,
                    0.11237230419977298
                ],
                [
                    4,
                    0.08626560726447219
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0681044267877412
                ],
                [
                    6,
                    0.03859250851305335
                ],
                [
                    7,
                    0.03859250851305335
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.5789473684210527,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 189,
            "mean_word_length": 4.661375661375661,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.6984126984126984,
            "num_of_stop_words": 30,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "We love beautiful, sexy feet. Touching them, feeling them, licking them, wrapping them around our cock\u2026 But every now and then, a little spice and variety is nice. Not too far away from feet is the hand. Specifically, handjob. Strokies is undeniably the best handjob website online, with over 600 exclusive videos featuring 500 amateurs\u2026\nLive Foot Fetish Sessions on LiveFetishCam\nWhether you are looking for some hot ladies that will do dildo footjob sessions or you need a dominant mistress that will tell you to worship her soles then you need to go to the LiveFetishCam.com site and they have the best live foot fetish cams online. The good thing about them is that they\u2026\nBarefoot Confidential 84\nOh sweet feet! Why do we love you so? What is it about your look, your taste, your feel and your smell?! Take away a woman\u2019s feet and you take away her power. They control us. We will do anything for them. Give them to us! Watch the Full Length, High Quality Movie! Oh sweet\u2026\nSarah Cute Pampering Feet\nToday\u2019s long awaited update features Czech veteran Kristof Cale being serviced by Hungarian coed Sarah Cute. After Kristof gets naked and shows us his big uncut cock \ud83c\udf46 Sarah steps in to sniff, kiss and lick his armpits before applying some lube \ud83d\udca7 and then doing the sniff/kiss/lick think to his feet. Pictures from See Him Fuck\nTony Lovecocks Foot Pampering\nYouthful hung stud Tony Lovelocks can make his See HIM Fuck debut now and we teamed HIM up with juicy blonde Indica Monroe because of this week\u2019s ridiculously warm update! The scene begins with the 20-year-old Las Vegas? endemic showing off the rather amazing bulge in the black suit pants of his. He undresses as\u2026\nLatina Foot Freak \u2013 Cassandra Cruz\nI like Latina girls like Cassandra especially if they\u2019re bare naked and barefoot plus having all the slutty skills that I want. Cassandra has great tits and more importantly delectable feet that got me really horny. I sucked her little toes before burying my face in between her cunt. Watch Cassandra sucking my cock before\u2026\nBarefoot Confidential\nGood looking dames have all the advantages and, thereby, get away with murder. If guys tried doing what you see on this boxcover with one another, there\u2019d be talk around the office and generous distance observed in the men\u2019s room. Put the secretaries in the same situation and, besides a lot of unaccountable peepholes in\u2026\nFalaka Whipping\nFalaka feet whipping of foot fetish slaves in pain \u2013 Falaka Feet Whipping \u2013 Falaka feet whipping of suffering foot fetish slave girl Beauvoir spanked on her soles and tied to a dungeon chair. Extreme foot fetishes and bastinado of brunette falaka slave girl Beauvoir. Intense punishment and feet domination of tied up amateur submissive\u2026\nVal Steele Pampering Feet\nEnglish stud Danny Mountain can make the debut of his with us now, as we 1st watch this properly hung hunk strip naked and also shows us his big British cock. In steps inked coed Val Steele to begin servicing him. She sniffs and also licks Danny\u2019s armpit before slathering him and also his huge\u2026\nVirtual Reality Foot Fetish\nMeet Stacy Cruz. She\u00b4s a 19 year old brunette babe from the Czech Republic. Her long legs are covered by black fishnet stockings. She comes in wearing high heels on perfectly shaped feet. Soon. She sensually removes the high heel shoes. Brings her feet up to her mouth in a flexible gymnastic move and starts\u2026\nSexy Foot Fetish Pictures\nFoot sex and feet fetishes can be defined as the wild dedication to sexy feet, foot worship, foot cumshot, and barefoot admiration. All other extraordinary fetishes that have to do with sexy feet and hot legs of beautiful girls are catered to in feet porn pics with unique shots of gorgeous girls foot worshipping, licking\u2026\nFalaka Feet Whipping\nFalaka feet whipping of foot fetish slaves in pain \u2013 Falaka Feet Whipping \u2013 Falaka feet whipping of suffering foot fetish slave girl Beauvoir spanked on her soles and tied to a dungeon chair. Extreme foot fetishes and bastinado of brunette falaka slave girl Beauvoir. Intense punishment and feet domination of tied up amateur submissive\u2026\nMelody Foxx Sucking Toes\nWhen this guy meets this horny brunette in an exceedingly dodgy bar and is invited up to her chamber he\u2019s very excited. He figures he\u2019s planning to screw and get his feet worked over. Melody Foxx Sucking Toes \u2013 Follow SeeHimFuck on Reddit However seems this woman may be a very little freakier than the\u2026\nProject Nylon\nAre you looking for a little more than drab and regular sexual encounters? Do you need a little extra to get you fully aroused? Watch as these babes incorporate their nylons and stocking into some steamy and erotically lustful sex that is passionate and exotic!!! Watch the Full Length, High Quality Movie! This clip from\u2026\nSex Feet Under 3\nDo you like feet? Then you are in the right place for foot fetish fun! Watch the Full Length, High Quality Movie! This clip from Sex Feet Under 3 by be.me.fi features a foot job with a girl in some red fishnet stockings rubbing her feet all over a masked and collared boy\u2019s hard cock.\u2026\nThe Driving Lesson\nAngel and Jacqui, in thongs, are headed to the shore in Angel\u2019s \u201964 Tempest. Jacqui admires the old car, and Angel offers to teach her how to drive a stick shift. First they have to overcome the Tempest\u2019s tendency to flood, the battery nearly dies before they figure out how to get it to catch.\u2026\nMistress Opium Addictive Domination\nMistress Opium is a rare flower indeed. She is strong, dominant and sadistic and humiliation of pathetic slaves is her party piece. Watch as she subjects her slaves to more and more humiliating punishments making them suck each other off for her ultimate pleasure. Watch the Full Length, High Quality Movie! This clip from Mistress\u2026\nBarefoot Confidential 67\nGood looking dames have all the advantages and, thereby, get away with murder. If guys tried doing what you see on this boxcover with one another, there\u2019d be talk around the office and generous distance observed in the men\u2019s room. Put the secretaries in the same situation and, besides a lot of unaccountable peepholes in\u2026\nClits And Toes\nThis title marks a return to Viv\u2019s very special Leg Sex titles. Filming a lot of the footage himself, he has produced yet another homage to the beautiful legs and feet of his trademark stunning models. Watch the Full Length, High Quality Movie! This title marks a return to Viv\u2019s very special Leg Sex titles.\u2026\nFetish Fantasy: Fishnet Foot Jobs With Anal\nLet your fantasies loose with \u201cFetish Fantasy\u201d from Channel 69 Video! This film features sexy women dressed in fishnet stockings performing foot jobs before taking it hard and deep anal style. Enjoy five scenes and over two hours of fetish fantasy driven ecstasy! Watch the Full Length, High Quality Movie! Let your fantasies loose with\u2026\nFantasy Footjobs 7\nYes, Virginia, there\u2019s a Santa Claus. And yes, footman, there is a heaven occupied by pretty girls with wiggly toes and sexy arches ready to accommodate the contours of your johnson. But we suggest that waiting to die to get there is an awful waste of time when you could be snuggling under the covers\u2026\nLeg Sex In The Sun\nDouble feet-ure! If you love your women hot and dressed in stockings and pantyhose and fucking with their fine feet, then this is the one for you, man! These European hotties are horny and they know how to please and get what they want! Thank you, Viv Thomas! Watch the Full Length, High Quality Movie!\u2026\nBarefoot Confidential 68\nTry for a moment to imagine that the lovely foot that you\u2019re now caressing is like a fine glass of wine. It\u2019s been aged appropriately, eighteen years at the minimum. After you gently released the foot in question from its exquisite container, you raise it to your nose and take a deep breath. Notice, if\u2026\nFantasy Footjobs 8\nAh, the art of the footjob. If it weren\u2019t for those brave souls seeking a new kind of penile satisfaction, where would we be now? Probably staring at our toes, which in turn would lead to footjobs in any case. The brave women at the front lines of keeping foot happy men sated do so\u2026\nBarefoot Confidential 69\nCan you remember a time when feet weren\u2019t the most important thing in your life? Thankfully, those soleless days are long gone. Now, an afternoon spent thinking about the curve of a young lady\u2019s arch is one well spent. Just the thought of soft pale soles marching their way up and down your body is\u2026\nShe\u2019s Got Legs\nThese girls may be hotter than Hell, but their legs stretch from here to Heaven! Vouyer Media is pleased to announce the release of She\u2019s Got Legs, Paradise Film Entertainment\u2019s XXX tribute to smooth hips, soft thighs and perfect calves. In each scene, succulent stems, slick pussies and firm breasts are worked over with lust\u2026\nWelcome To Footville 4\nThe best foot fetish movie is back with more top pornstars who use their feet like you\u2019ve never seen before. Everything a foot lover ever wanted. Hardcore foot action! Watch the Full Length, High Quality Movie! The best foot fetish movie is back with more top pornstars who use their feet like you\u2019ve never seen\u2026",
        "meta": {
            "lang": "en",
            "lang_score": 0.9100993275642395,
            "url": "http://www.footfetishreview.com/?e=blackberry-q10-is-4g-or-not-a-dL7r0kC5",
            "timestamp": "2023-11-28T09:40:41Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 2.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.03773584905660377,
            "fraction_of_characters_in_duplicate_lines": 0.07335907335907337,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.014645187058980163
                ],
                [
                    3,
                    0.012781254160564505
                ],
                [
                    4,
                    0.020236985754227135
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.1262148848355745
                ],
                [
                    6,
                    0.1262148848355745
                ],
                [
                    7,
                    0.12222074291039808
                ],
                [
                    8,
                    0.10784183197976302
                ],
                [
                    9,
                    0.10304886166955132
                ],
                [
                    10,
                    0.09719078684595926
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.01738050900062073,
            "fraction_of_lines_ending_with_ellipsis": 0.32098765432098764,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 25,
            "num_of_toxic_words": 49,
            "word_count": 1583,
            "mean_word_length": 4.744788376500316,
            "num_of_sentences": 82,
            "symbol_to_word_ratio": 0.017056222362602652,
            "fraction_of_words_with_alpha_character": 0.9861023373341756,
            "num_of_stop_words": 337,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Hans de Ruiter presented the DIY laptop kit for the A1222 motherboard during AmiWest 2017. Some\u2026\nDay: 1 April 2018\nTony Hawk big fan of Commodore Amiga computers\nTony Hawk legendary professional skateboarder, actor and owner of Birdhouse, loved his Commodore Amiga 2000 for making\u2026\nFull release of Spencer available: Jump\u00b4n Run with challenging levels\nEntwickler-X proudly announced the full release of Spencer for AmigaOS 4.1. Spencer is a classic Jump\u00b4n\u2026\nRoad Avenger released for Commodore Amiga\nPixelglass proudly announced the full release of Road Avenger for Commodore Amiga. Road Avenger is an interactive\u2026\nNew wireless keyboard adapter for Commodore Amiga computers\nAmiga user Teemu Leppanen released a very interesting documentation on GitHub for making a wireless keyboard\u2026",
        "meta": {
            "lang": "en",
            "lang_score": 0.846389651298523,
            "url": "http://www.generationamiga.com/2018/04/01/",
            "timestamp": "2023-11-28T11:10:04Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.08408408408408409
                ],
                [
                    3,
                    0.05855855855855856
                ],
                [
                    4,
                    0.06006006006006006
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.04804804804804805
                ],
                [
                    6,
                    0.04804804804804805
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.5,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 118,
            "mean_word_length": 5.6440677966101696,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0423728813559322,
            "fraction_of_words_with_alpha_character": 0.9576271186440678,
            "num_of_stop_words": 17,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Since 2017, the partnership between BYD and GoShop changed the game in central and east-africa.\nThis combination does not exist.\nTerms and Conditions\n30-day money-back guarantee",
        "meta": {
            "lang": "en",
            "lang_score": 0.9349461793899536,
            "url": "http://www.goshop.cd/shop/sm30-30mm-insulation-with-m10-screw-5143",
            "timestamp": "2023-11-28T08:46:31Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 2.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.06578947368421052
                ],
                [
                    3,
                    0.08552631578947369
                ],
                [
                    4,
                    0.15789473684210525
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 26,
            "mean_word_length": 5.846153846153846,
            "num_of_sentences": 3,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9615384615384616,
            "num_of_stop_words": 6,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Server Error in Forum ApplicationAn error has occured while connecting to the database.Please contact the forum administrator.Support Error Code:- err_Access_db_connectionFile Name:- common.aspError details:-Microsoft JET Database EngineCould not use ''; file already in use.",
        "meta": {
            "lang": "en",
            "lang_score": 0.7400292754173279,
            "url": "http://www.gradiste.com/forum4/login_user.asp?FID=0&SID=1a9714cz11c79735f53358a6c9613e99",
            "timestamp": "2023-11-28T09:25:48Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.04526748971193416
                ],
                [
                    3,
                    0.053497942386831275
                ],
                [
                    4,
                    0.07407407407407407
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 33,
            "mean_word_length": 7.363636363636363,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9696969696969697,
            "num_of_stop_words": 5,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "The Universe should be deemed an immense Being, always living, always moved and always moving in an eternal activity inherent in itself, and which, subordinate to no foreign cause, is communicated to all its parts, connects them together, and makes the world of things a complete and perfect whole.\nPike, Albert",
        "meta": {
            "lang": "en",
            "lang_score": 0.9471049904823303,
            "url": "http://www.greatfamousquotes.com/universe/the-universe-should-be-deemed-an/",
            "timestamp": "2023-11-28T09:57:23Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.0421455938697318
                ],
                [
                    3,
                    0.06513409961685823
                ],
                [
                    4,
                    0.07279693486590039
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 51,
            "mean_word_length": 5.117647058823529,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 1.0,
            "num_of_stop_words": 14,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "About Jean Holy Smithereens\nJean is a lover of luxury travel and adventure, always looking for that \"Holy Smithereens\"-inducing moment on her travels. Follow the blog and other social media pages of Holy Smithereens to get the ultimate travel ideas for the luxurious adventurer!",
        "meta": {
            "lang": "en",
            "lang_score": 0.8576588034629822,
            "url": "http://www.holysmithereens.com/2012/06/when-in-cancun-last-part/img_0390/",
            "timestamp": "2023-11-28T10:37:37Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.1276595744680851
                ],
                [
                    3,
                    0.05531914893617021
                ],
                [
                    4,
                    0.10212765957446808
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 44,
            "mean_word_length": 5.340909090909091,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 1.0,
            "num_of_stop_words": 13,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "\u25a0 Used for protection against ticks, fleas, ear lice and other similar vermin\n\u25a0 Helps with wounds, stitches and other damage to the skin of animals\n\u25a0 Improves hair and skin of animals\nWith its minerals diatomite and zeolite ANTIKRPELJ dries out and destroys skeletons of ticks, fleas, ear lice and other similar vermin and thus provides protection for your pet or domestic animal.\nIn addition to that, ANTIKRPELJ\u2019s composition has other minerals that work together to help in the recovery of the skin and hair health\nANTIKRPELJ is the organic product from natural minerals, and therefore not harmful to humans and the environment\nThe composition, method of use and the declaration is on the label.",
        "meta": {
            "lang": "en",
            "lang_score": 0.9124675393104553,
            "url": "http://www.i-zeolit.rs/en/zeolite-for-animal-protection/antikrpelj-fungicidal-powder-from-natural-minerals/",
            "timestamp": "2023-11-28T11:21:32Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.041237113402061855
                ],
                [
                    3,
                    0.05154639175257732
                ],
                [
                    4,
                    0.06529209621993128
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.06872852233676977
                ],
                [
                    6,
                    0.06872852233676977
                ],
                [
                    7,
                    0.06872852233676977
                ],
                [
                    8,
                    0.06872852233676977
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.01694915254237288,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.375,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 116,
            "mean_word_length": 5.017241379310345,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9741379310344828,
            "num_of_stop_words": 41,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "17 Aug Blog MCT oil \u2013 Is it Healthy for you? August 17, 2022 By lokeshwaranit 0 comments An overview of MCT oil & Medium-chain Triglycerides: MCT oil is a supplement made from a type of fat called Medium-Chain Triglyc...Continue reading",
        "meta": {
            "lang": "en",
            "lang_score": 0.9358170628547668,
            "url": "http://www.innerbio.com/?page_id=E1500688",
            "timestamp": "2023-11-28T11:05:31Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.09183673469387756
                ],
                [
                    3,
                    0.04591836734693878
                ],
                [
                    4,
                    0.061224489795918366
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 41,
            "mean_word_length": 4.780487804878049,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.024390243902439025,
            "fraction_of_words_with_alpha_character": 0.8536585365853658,
            "num_of_stop_words": 2,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Fallen Aspen Leaves\n11\" x 60\" 100% silk flat crepe\nHand painted - Hand rolled edge\nI love the shapes and colors of aspen leaves, especially when they fall on the ground.\nEach scarf is individually hand painted. No two are exactly alike.\nPlease allow 10 days for delivery.",
        "meta": {
            "lang": "en",
            "lang_score": 0.9086345434188843,
            "url": "http://www.inspiredwilddesigns.com/product/fallen-aspen-leaves",
            "timestamp": "2023-11-28T09:02:43Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.04932735426008968
                ],
                [
                    3,
                    0.07623318385650224
                ],
                [
                    4,
                    0.08968609865470852
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.02,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 49,
            "mean_word_length": 4.551020408163265,
            "num_of_sentences": 4,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.8979591836734694,
            "num_of_stop_words": 8,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Julie Anne Longano | All or Nothing\nLifestyle | Experiences | Wellness | For Fun\nMarch 25, 2013\n, Julie Anne , Leave a comment\nComments *\nName *\nEmail *\nSave my name, email, and website in this browser for the next time I comment.",
        "meta": {
            "lang": "en",
            "lang_score": 0.7549252510070801,
            "url": "http://www.julieanne.com.au/2013/03/from-bali-with-love-love-and-more-love/img_5170/",
            "timestamp": "2023-11-28T09:41:54Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.0972972972972973
                ],
                [
                    3,
                    0.08648648648648649
                ],
                [
                    4,
                    0.0918918918918919
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.041666666666666664,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 46,
            "mean_word_length": 4.021739130434782,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.7608695652173914,
            "num_of_stop_words": 2,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Contact Us\nPhone: 706.882.9909\nEmail: info@lsparts.org\nPhysical & Mailing Address: 214 Bull Street, LaGrange, GA 30240\nBusiness Office Hours of Operation:\nNeed to Purchase Tickets or Pay Tuition or Fees?\nFacebook Page: www.facebook.com/LafayetteSocietyForPerformingArts.com",
        "meta": {
            "lang": "en",
            "lang_score": 0.6598145961761475,
            "url": "http://www.lsparts.org/About%20Us/Contact.html",
            "timestamp": "2023-11-28T11:03:58Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.03734439834024896
                ],
                [
                    3,
                    0.06224066390041494
                ],
                [
                    4,
                    0.11203319502074689
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 33,
            "mean_word_length": 7.303030303030303,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.8787878787878788,
            "num_of_stop_words": 3,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "IMG_3021 maaritNovember 13, 2014November 19, 2014 No Comments \u00ab Previous Next \u00bb Leave a Reply Cancel replyYour email address will not be published. Required fields are marked *Comment * Name * Email * Website \u0394 This site uses Akismet to reduce spam. Learn how your comment data is processed.",
        "meta": {
            "lang": "en",
            "lang_score": 0.7620609402656555,
            "url": "http://www.maaritmaailma.com/go-west-key-west/img_3021-3/",
            "timestamp": "2023-11-28T10:40:29Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.09053497942386832
                ],
                [
                    3,
                    0.102880658436214
                ],
                [
                    4,
                    0.1522633744855967
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 49,
            "mean_word_length": 4.959183673469388,
            "num_of_sentences": 3,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.8163265306122449,
            "num_of_stop_words": 4,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "You are hereAnonymus 025\nBy Drainspotter - Posted on 24 April 2011\n24. April 2011\nman\u00b7hole ( mnhl ) n.\na hole through which a man can get into a sewer, conduit, etc. for repairs or inspection",
        "meta": {
            "lang": "en",
            "lang_score": 0.8466553688049316,
            "url": "http://www.manholecovers.de/an025",
            "timestamp": "2023-11-28T10:50:38Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.11612903225806452
                ],
                [
                    3,
                    0.11612903225806452
                ],
                [
                    4,
                    0.13548387096774195
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.02631578947368421,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 37,
            "mean_word_length": 4.1891891891891895,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.7837837837837838,
            "num_of_stop_words": 1,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Goddamn it. My website of 10 years was hacked last Thu \u2013 so I had to re-create the damn new site. Because four of my 82 sites were hacked and I had to take them down \u2013 I will just \u201cSIMPLIFY\u201d the site. My theatre, class, corporate, consulting sites will [\u2026] New Site!16 Aug, 2015 in Audio Book / Audition / Basic / Benefit / Event / Class / Corporate / Headshot / Images / Improv / On-Camera / Productivity / Random Thoughts / Scene Study / Theatre / Young Actors tagged acting class / acting class in Los Angeles / actors / actors head shot / actors slate / arts / business / crafts / head shots / headshots / improv / Las Vegas / los Angeles / New York / on-camera / Tokyo / working actors by Kaz (updated 3025 days ago)",
        "meta": {
            "lang": "en",
            "lang_score": 0.8993353843688965,
            "url": "http://www.matamura.com/tag/actors-slate/",
            "timestamp": "2023-11-28T10:44:49Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.03633217993079585
                ],
                [
                    3,
                    0.020761245674740483
                ],
                [
                    4,
                    0.0328719723183391
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 144,
            "mean_word_length": 4.013888888888889,
            "num_of_sentences": 4,
            "symbol_to_word_ratio": 0.006944444444444444,
            "fraction_of_words_with_alpha_character": 0.7361111111111112,
            "num_of_stop_words": 19,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "our website\n>>> return to the\nmain gallery page by clicking here\nCopyright San Francisco Basque Cultural Center 2006\n- 2022\nSite designed by Izar and developed by Readywebgo",
        "meta": {
            "lang": "en",
            "lang_score": 0.8663689494132996,
            "url": "http://www.ondarenet.kultura.ejgv.euskadi.eus:8085/wayback/es/20221123111607/http://www.sfbcc.us/gallery/24/8HZ",
            "timestamp": "2023-11-28T10:06:58Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.06896551724137931
                ],
                [
                    3,
                    0.0896551724137931
                ],
                [
                    4,
                    0.1310344827586207
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.03333333333333333,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.14285714285714285,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 29,
            "mean_word_length": 5.0,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.8620689655172413,
            "num_of_stop_words": 3,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Powered by phpBB \u00a9 2001, 2005 phpBB Group - Design: niedermayr.cc\nGuild Wars \u00a9 2004 ArenaNet, Inc. All rights reserved. ArenaNet, Arena.Net and the ArenaNet logo are trademarks or registered trademarks of NCsoft Corporation in the U.S. and/or other countries.",
        "meta": {
            "lang": "en",
            "lang_score": 0.8795174956321716,
            "url": "http://www.order-of-phalanx.net/forum/faq.php?sid=aaa4d8ebf666c9b6221cd705f833d78d",
            "timestamp": "2023-11-28T10:37:47Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.04090909090909091
                ],
                [
                    3,
                    0.06363636363636363
                ],
                [
                    4,
                    0.06818181818181818
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.024390243902439025,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 40,
            "mean_word_length": 5.5,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.85,
            "num_of_stop_words": 7,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Saturday, May 28, 2011\nBeen shopping\n20 comments:\n- Kate said...\nHmmmm, what was that comment about quilts and cults???\n- May 28, 2011 at 4:03 PM\n- A Spoonful Of Sugar said...\nLucky you - they haven't arrived at my store yet!\n- May 28, 2011 at 4:08 PM\n- Cathy @ CabbageQuilts said...\nOoh Yum! xo\n- May 28, 2011 at 4:40 PM\n- mybeardedpigeon@gmail.com said...\nI've been shopping too! Your fabric is lovely!\n- May 28, 2011 at 4:45 PM\n- rachelmp said...\nI'm still on my fabric diet but I bought 4 pirnts at Ballarat spotlight today. Worth the trip there!\n- May 28, 2011 at 6:45 PM\n- Cathie said...\nooooh wow!\ngood to meet you yesterday Andi \u2665\n- May 28, 2011 at 7:51 PM\n- Marit said...\nmmm.... too tempting!\n; )\n- May 28, 2011 at 8:15 PM\n- Miriam said...\nGorgeous fabrics Andi!!\nI hope you, your Dad and Jake are all recovering well.\n- May 28, 2011 at 8:39 PM\n- andrea creates said...\nmore colorways-fun!\n- May 28, 2011 at 8:46 PM\n- Kristie said...\n- May 29, 2011 at 8:29 AM\n- Catherine said...\noh, lovely!\nIt was great meeting you on Friday - hope you have a good week...\n- May 29, 2011 at 9:25 AM\n- Leonie @ Cuppa and Cake said...\nOh...now I understand what you were talking about. Nice...very nice indeed!! xx\n- May 29, 2011 at 10:11 AM\n- anhaga sae / lisa said...\nI did the same today! But just picked up the reds/pinks/mustards. Lovely! Can't wait to start cutting!\n- May 29, 2011 at 9:17 PM\n- Katherine said...\nWahoo! Looks like you hit the jackpot - can't wait to see what these beauties will become.\n- May 30, 2011 at 7:29 AM\n- meli B said...\nLove the fabric and the baby quilt. Glad you are back into the swing of things. There's a half price sale at Patchwork House next week. Think I will check it out. They have some nice stuff.\n- May 30, 2011 at 8:32 PM\n- Brianna said...\nI'm glad I'm not the only one buying the whole range, feel better now! Still haven't worked out what I'm am going to make with mine, will probably just end up in the ever growing stash.\n- June 1, 2011 at 6:25 PM\n- Theresa said...\nI feel like a winner with my DS stash. Aren't we lucky! I bet there's some US girls that are a bit miffed we got some that they didn't!\n- June 3, 2011 at 3:56 PM\n- Shanna said...\nI am loving the yellows!! Jealous we didn't get those here ;o)\n- June 4, 2011 at 7:37 AM\nwell, lucky you, I would walk to australia for those, ;o)))\n- June 7, 2011 at 3:53 AM\n- Hi! My name is erica. Would you be my friend? said...\nI'm cracking myself up! I was about to tell you how jealous I was when I realized that I have this too! Yay! :D (Not yardage though...just fat quarters)\n- June 7, 2011 at 7:13 AM",
        "meta": {
            "lang": "en",
            "lang_score": 0.9645588994026184,
            "url": "http://www.patchandi.com/2011/05/been-shopping.html?showComment=1306565100330",
            "timestamp": "2023-11-28T08:51:56Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.057803468208092484
                ],
                [
                    3,
                    0.04816955684007707
                ],
                [
                    4,
                    0.0476878612716763
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.08140655105973026
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.04036697247706422,
            "fraction_of_lines_ending_with_ellipsis": 0.22988505747126436,
            "fraction_of_lines_starting_with_bullet_point": 0.4482758620689655,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 1,
            "num_of_toxic_words": 1,
            "word_count": 523,
            "mean_word_length": 3.9694072657743784,
            "num_of_sentences": 39,
            "symbol_to_word_ratio": 0.045889101338432124,
            "fraction_of_words_with_alpha_character": 0.7858508604206501,
            "num_of_stop_words": 63,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "But trusty Mary came up with the perfect idea ..... get Michelle to print the design with her fancy shmancy (and extremely awesome) new fabric printing business and ask Cindy to help out with creating the digital file. (I LOVE my crafty friends!!!)\nSo I went along last week to Frankie & Swiss headquarters to experience the magic in person and the amazing light and airy space took my breath away!! Here's a few examples of the space and the amazing pieces on display ...",
        "meta": {
            "lang": "en",
            "lang_score": 0.9402411580085754,
            "url": "http://www.patchandi.com/2011/11/diy-chic-geek-quilt.html",
            "timestamp": "2023-11-28T08:59:51Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.030927835051546393
                ],
                [
                    3,
                    0.06701030927835051
                ],
                [
                    4,
                    0.04381443298969072
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.5,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 85,
            "mean_word_length": 4.564705882352941,
            "num_of_sentences": 4,
            "symbol_to_word_ratio": 0.023529411764705882,
            "fraction_of_words_with_alpha_character": 0.9647058823529412,
            "num_of_stop_words": 21,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "A recent article caught my attention and it reminded me of the compatibility between design and nature. This story is about the 20 year effort by the City of Paradise Valley, Arizona to eliminate all electrical power lines and bury them underground. Having lived in this beautiful area I can tell you that it makes [...]\nI have listened to the argument on both sides of the city signage issue and my choice is clear. No matter how much you think that those billboards and clutter of signs might help to advertise your business, they harm the environment as a whole and that in turn harms everyone\u2019s business. Internet advertising and [...]\nPerhaps you have lived in an apartment or stayed in a motel and outside your window you find yourself staring into a huge billboard or some flashing neon sign. Instead of gazing out at the branches of a lovely tree or viewing a charming sidewalk you are visually blindsided by this type of pollution. Many [...]\nA new small shopping mall was completed recently and after 5 months it still sits mostly vacant. The economy certainly has something to do with that however, there are some things that can be done to create more curb appeal for this project. The architecture is very modern in style and the project sits at [...]",
        "meta": {
            "lang": "en",
            "lang_score": 0.9729899168014526,
            "url": "http://www.sancarlosjaney.com/tag/visual-pollution/",
            "timestamp": "2023-11-28T10:49:18Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.009606147934678195
                ],
                [
                    3,
                    0.013448607108549471
                ],
                [
                    4,
                    0.01921229586935639
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 1.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 224,
            "mean_word_length": 4.647321428571429,
            "num_of_sentences": 9,
            "symbol_to_word_ratio": 0.017857142857142856,
            "fraction_of_words_with_alpha_character": 0.9732142857142857,
            "num_of_stop_words": 48,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "It is currently Tue Nov 28, 2023 2:41 am\nIn total there are 3 users online :: 0 registered, 0 hidden and 3 guests (based on users active over the past 5 minutes)\nMost users ever online was 2348 on Fri Mar 13, 2020 1:57 am\nRegistered users: No registered users\nLegend: Administrators, Global moderators\nTotal posts 14919 \u2022 Total topics 478 \u2022 Total members 100 \u2022 Our newest member Justo",
        "meta": {
            "lang": "en",
            "lang_score": 0.8563199639320374,
            "url": "http://www.sciphysicsforums.com/spfbb1/index.php?sid=64f4c6d959be7250a478a769061872eb",
            "timestamp": "2023-11-28T09:41:04Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.03821656050955414
                ],
                [
                    3,
                    0.041401273885350316
                ],
                [
                    4,
                    0.050955414012738856
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 71,
            "mean_word_length": 4.422535211267606,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.7323943661971831,
            "num_of_stop_words": 13,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Broadway Locker Coordinator\nJulie Welch\nArtistic Staff\nProducing Artistic Director - Bobby Hundley\nManaging Director - Ray A. Rochelle\nResident Choreographer - Rikki Lugo\nAnthony Sands\nJacquelyn DeLeon\nBoard Members\nJerry Durgerian\nEJ Lugo\nGrants & Donor\nCommunications Associate\nBobby Hundley\nLinda K. Igarashi\nBoard of Directors\nAdvisory Board Members\nState Senator Bob Huff\nJeff De Francisco\nPhil Gold",
        "meta": {
            "lang": "en",
            "lang_score": 0.7681922316551208,
            "url": "http://www.sgvmusictheatre.org/board-of-directors.html",
            "timestamp": "2023-11-28T11:09:54Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.05202312138728324
                ],
                [
                    3,
                    0.07225433526011561
                ],
                [
                    4,
                    0.08670520231213873
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.04838709677419355,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 59,
            "mean_word_length": 5.864406779661017,
            "num_of_sentences": 1,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9322033898305084,
            "num_of_stop_words": 9,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "New Products\nFind Tray Erecting Machine, Tray Erecting Machine Carton, Hotmelt Glue Erector Machine on Industry Directory, Reliable Manufacturer/Supplier/Factory from China.\n|Unit Price:\n|Min. Order:\n|1 Set/Sets\nDurable Erecting Packing Machine Carton Box Case Erector packing process\nProduct Categories : OTHER PRODUCTS > CARTON & CASE ERECTORS",
        "meta": {
            "lang": "en",
            "lang_score": 0.6798381805419922,
            "url": "http://www.shrinkpacker.net/carton-case-erectors-65/60984064.html",
            "timestamp": "2023-11-28T11:16:16Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 2.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.0802675585284281
                ],
                [
                    3,
                    0.05016722408026756
                ],
                [
                    4,
                    0.06354515050167224
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.04081632653061224,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 47,
            "mean_word_length": 6.361702127659575,
            "num_of_sentences": 3,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9148936170212766,
            "num_of_stop_words": 9,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Your email address will not be published. Required fields are marked *\nSave my name, email, and website in this browser for the next time I comment.\nCopyright \u00a9 2018 By Saju John Mathew. Website by Prayer United",
        "meta": {
            "lang": "en",
            "lang_score": 0.9342812895774841,
            "url": "http://www.sjmathew.com/%E0%B4%AF%E0%B5%87%E0%B4%B6%E0%B5%81%E0%B4%B5%E0%B4%BF%E0%B4%A8%E0%B5%86-%E0%B4%89%E0%B4%B3%E0%B4%B3%E0%B4%BF%E0%B5%BD-%E0%B4%95%E0%B5%88%E0%B4%95%E0%B5%8A%E0%B4%B3%E0%B5%8D%E0%B4%B3%E0%B5%81%E0%B4%AE/",
            "timestamp": "2023-11-28T11:02:26Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.05172413793103448
                ],
                [
                    3,
                    0.09195402298850575
                ],
                [
                    4,
                    0.11494252873563218
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 38,
            "mean_word_length": 4.578947368421052,
            "num_of_sentences": 4,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 0.9210526315789473,
            "num_of_stop_words": 4,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "Out of many facets of degradation of our culture, one of the worst is the decline of the basic freedoms enshrined in (but not created by) the US Constitution and Bill of Rights, this has mostly been executed by this same process of turning rights into mere priveleges, this goes that extra step by saying only educated professionals have that privilege. This same lack of ethics and understanding of basic human rights can be seen everywhere in the surveillance state and in the way police treat the citizens they are supposed to be protecting and in the courts that coerce people who cant afford a lawyer into rescinding their right to a fair trial by a jury of their peers by threatening them with a longer sentence if they refuse to plea bargain and admit they are guilty even when they know they are not.-Matt Sonnie",
        "meta": {
            "lang": "en",
            "lang_score": 0.9759474992752075,
            "url": "http://www.skepticaleye.com/2015/05/dianne-feinstein-is-enemy-of-bill-of.html",
            "timestamp": "2023-11-28T10:07:22Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 2.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.022222222222222223
                ],
                [
                    3,
                    0.023703703703703703
                ],
                [
                    4,
                    0.022222222222222223
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.0,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 146,
            "mean_word_length": 4.623287671232877,
            "num_of_sentences": 2,
            "symbol_to_word_ratio": 0.0,
            "fraction_of_words_with_alpha_character": 1.0,
            "num_of_stop_words": 46,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    },
    {
        "text": "13 Jun Gypsum Shipment\nPosted at 16:54h in News\nThe Strait of Canso Superport Corporation continues to utilize the Mulgrave Marine Terminal to support local industry. Approximately 32,000 tonnes of gypsum was offloaded in Mulgrave and trucked to the Cabot Gypsum wall board plant at Point Tupper in Richmond County. The Superport Corporation, making its...",
        "meta": {
            "lang": "en",
            "lang_score": 0.9152089953422546,
            "url": "http://www.straitsuperport.com/2023/06/",
            "timestamp": "2023-11-28T08:51:43Z",
            "cc-path": "crawl-data/CC-MAIN-2023-50/segments/1700679099281.67/warc/CC-MAIN-20231128083443-20231128113443-00000.warc.gz",
            "url_score": 0.0
        },
        "quality_signals": {
            "url_score": 0.0,
            "fraction_of_duplicate_lines": 0.0,
            "fraction_of_characters_in_duplicate_lines": 0.0,
            "fraction_of_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_duplicate_paragraphs": 0.0,
            "fraction_of_characters_in_most_common_ngram": [
                [
                    2,
                    0.016556291390728478
                ],
                [
                    3,
                    0.03642384105960265
                ],
                [
                    4,
                    0.06291390728476821
                ]
            ],
            "fraction_of_characters_in_duplicate_ngrams": [
                [
                    5,
                    0.0
                ],
                [
                    6,
                    0.0
                ],
                [
                    7,
                    0.0
                ],
                [
                    8,
                    0.0
                ],
                [
                    9,
                    0.0
                ],
                [
                    10,
                    0.0
                ]
            ],
            "fraction_of_words_corrected_in_lines": 0.0,
            "fraction_of_lines_ending_with_ellipsis": 0.3333333333333333,
            "fraction_of_lines_starting_with_bullet_point": 0.0,
            "fraction_of_lines_with_toxic_words": 0.0,
            "num_of_lines_with_toxic_words": 0,
            "num_of_toxic_words": 0,
            "word_count": 55,
            "mean_word_length": 5.490909090909091,
            "num_of_sentences": 3,
            "symbol_to_word_ratio": 0.01818181818181818,
            "fraction_of_words_with_alpha_character": 0.9636363636363636,
            "num_of_stop_words": 12,
            "num_of_paragraphs": 0,
            "has_curly_bracket": false,
            "has_lorem_ipsum": false,
            "orig_text_has_dup_lines": false
        }
    }
]