diff --git a/advertools/extract.py b/advertools/extract.py index 438b95e3..c61273ea 100644 --- a/advertools/extract.py +++ b/advertools/extract.py @@ -39,16 +39,34 @@ The recommended way of using: ->>> import advertools as adv ->>> text_list = ['This is the first #text.', 'Second #sentence is here.', -... 'Hello, how are you?', 'This #sentence is the last #sentence'] ->>> hashtag_summary = adv.extract_hashtags(text_list) ->>> hashtag_summary.keys() -dict_keys(['hashtags', 'hashtags_flat', 'hashtag_counts', 'hashtag_freq', - 'top_hashtags', 'overview']) +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + import advertools as adv + + text_list = ['This is the first #text.', 'Second #sentence is here.', + 'Hello, how are you?', 'This #sentence is the last #sentence'] + hashtag_summary = adv.extract_hashtags(text_list) + hashtag_summary.keys() + +.. code-block:: + + dict_keys(['hashtags', 'hashtags_flat', 'hashtag_counts', 'hashtag_freq', + 'top_hashtags', 'overview']) Now you can start exploring: +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + hashtag_summary + >>> hashtag_summary['overview'] {'num_posts': 4, 'num_hashtags': 4, @@ -66,6 +84,526 @@ >>> hashtag_summary['top_hashtags'] [('#sentence', 3), ('#text', 1)] +Let's explore a proper dataset of tweets, which you can generate using one of +the functions in the :ref:`twitter API ` module. + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + import advertools as adv + import pandas as pd + + tweets = pd.read_csv('data/tweets.csv') + print(tweets.shape) + tweets.head() + +==== ================================================================================================================================================ ================= + .. 
tweet_text followers_count +==== ================================================================================================================================================ ================= + 0 @AERIALMAGZC @penguinnyyyyy you won't be afraid if I give you a real reason :D 157 + 1 Vibing in the office to #Metallica when the boss is on a coffee break 4687 + #TheOffice https://t.co/U5vdYevvfe + 2 I feel like Ann says she likes coffee and then gets drinks that are 99% sugar and 1% coffee https://t.co/HfuBV4v3aY 104 + 3 A venti iced coffee with four pumps of white mocha, sweet cream and caramel drizzle might just be my new favorite drink. Shout out to TikTok lol 126 + 4 I was never a coffee person until I had kids. ☕️ this cup is a life saver. https://t.co/Zo0CnVuiGj 1595 + 5 Who's excited about our next Coffee Chat? We know we are!🥳 5004 + + We're also adding Representative John Bradford to this lineup to discuss redistricting in the area. You won't want to miss it! + + RSVP: https://t.co/R3YNJjJCUG + Join the meeting: https://t.co/Ho4Kx7ZZ24 https://t.co/KfPdR3hupY + 6 he paid for my coffee= husband💗 165 + 7 It's nipply outside, and now I side too :) 0 + That sounds like blowjob in front of a fire and visit with coffee after :) + I'm still out of coffee + I could have green tea instead + Hahahahahahaha + I want to spend the morning pampering you ... + 8 Good morning 😃🌞☀️ I hope everyone has a great Tuesday morning. Enjoy your day and coffee ☕️ ♥️❤️💕🥰😘 189 + 9 @MarvinMilton2 I nearly choked on my coffee 🤪 1160 +==== ================================================================================================================================================ ================= + +Extract `#hashtags` +------------------- + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + hashtag_summary = adv.extract_hashtags(tweets['tweet_text']) + hashtag_summary.keys() + +.. 
code-block:: + + dict_keys(['hashtags', 'hashtags_flat', 'hashtag_counts', 'hashtag_freq', + 'top_hashtags', 'overview']) + + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + hashtag_summary['overview'] + +.. code-block:: + + {'num_posts': 2000, + 'num_hashtags': 733, + 'hashtags_per_post': 0.3665, + 'unique_hashtags': 572} + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + [h for h in hashtag_summary['hashtags'] if h][:10] + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + hashtag_summary['top_hashtags'][:10] + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + hashtag_summary['hashtag_freq'] + + +Extract `@mentions` +------------------- + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + mention_summary = adv.extract_mentions(tweets['tweet_text']) + mention_summary.keys() + +.. code-block:: + + dict_keys(['mentions', 'mentions_flat', 'mention_counts', 'mention_freq', + 'top_mentions', 'overview']) + + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + mention_summary['overview'] + +.. code-block:: + + {'num_posts': 2000, + 'num_mentions': 1346, + 'mentions_per_post': 0.673, + 'unique_mentions': 1132} + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + pd.DataFrame(zip(mention_summary['mentions'], + mention_summary['mention_counts']), + columns=['mentions', 'count']) + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + [h for h in mention_summary['mentions'] if h][:10] + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + mention_summary['top_mentions'][:10] + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + mention_summary['mention_freq'] + +.. 
thebe-button:: + Run this code + + +Extract Currency `$ ¢ £ ¤ ¥ ֏ ؋ ₲ ₵ ₸ ₹﹩ ¢ £ ¥ ₩ ₺ ₻ ₼ ₽ ₾ ₿ ﷼` +--------------------------------------------------------------------- + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + currency_summary = adv.extract_currency(tweets['tweet_text']) + currency_summary.keys() + +.. code-block:: + + dict_keys(['currency_symbols', 'currency_symbols_flat', + 'currency_symbol_counts', 'currency_symbol_freq', + 'top_currency_symbols', 'overview', 'currency_symbol_names', + 'surrounding_text']) + + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + currency_summary['overview'] + +.. code-block:: + + {'num_posts': 2000, + 'num_currency_symbols': 37, + 'currency_symbols_per_post': 0.0185, + 'unique_currency_symbols': 4} + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + currency_summary['top_currency_symbols'] + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + [text for text in currency_summary['surrounding_text'] if text][:10] + + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + [sym for sym in currency_summary['currency_symbol_names'] if sym][:10] + + +Extract numbers `1234567890٠١٢٣٤٥٦٧٨٩㊺𑁛𐄍𐢪⓲𑁣𐄨𐤛` +-------------------------------------------------- + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + number_summary = adv.extract_numbers(tweets['tweet_text']) + number_summary.keys() + +.. code-block:: + + dict_keys(['numbers', 'numbers_flat', 'number_counts', 'number_freq', + 'top_numbers', 'overview']) + + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + number_summary['overview'] + +.. code-block:: + + {'num_posts': 2000, + 'num_numbers': 1727, + 'numbers_per_post': 0.8635, + 'unique_numbers': 257} + +.. thebe-button:: + Run this code + +.. 
code-block:: + :class: thebe, thebe-init + + number_summary['number_freq'] + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + pd.DataFrame({ + 'numbers': number_summary['numbers'], + 'counts': number_summary['number_counts'], + }).head(20) + + +Extract questions `? ¿ ; ՞ ؟ ፧ ᥅ ⁇ ⁈ ⁉ ⳺ ⳻ ⸮ ꘏ ꛷ ︖ ﹖ ? 𑅃 𞥟 ʔ ‽` +------------------------------------------------------------------ + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + question_summary = adv.extract_questions(tweets['tweet_text']) + question_summary.keys() + +.. code-block:: + + dict_keys(['question_marks', 'question_marks_flat', 'question_mark_counts', + 'question_mark_freq', 'top_question_marks', 'overview', + 'question_mark_names', 'question_text']) + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + question_summary['overview'] + +.. code-block:: + + {'num_posts': 2000, + 'num_question_marks': 321, + 'question_marks_per_post': 0.1605, + 'unique_question_marks': 1} + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + question_summary['question_text'][:25] + +.. code-block:: + + [[], + [], + [], + [], + [], + ["Who's excited about our next Coffee Chat?"], + [], + [], + [], + [], + ['@ckaiserjr @perry_ron @LILGUYISBACK Is it okay if the hot water is flavored with coffee?'], + [], + [], + [], + [], + [], + [], + [], + [], + [], + ["You think if you do that you'll loose your followers ???"], + [], + [], + ['maybe more coffee will help?'], + []] + + +Extract Exclamations `! ¡ ՜ ߹ ᥄ ‼ ⁈ ⁉ ︕ ﹗ ! 𞥞` +------------------------------------------------- + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + exclamation_summary = adv.extract_exclamations(tweets['tweet_text']) + exclamation_summary.keys() + +.. 
code-block:: + + dict_keys(['exclamation_marks', 'exclamation_marks_flat', + 'exclamation_mark_counts', 'exclamation_mark_freq', + 'top_exclamation_marks', 'overview', 'exclamation_mark_names', + 'exclamation_text']) + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + exclamation_summary['overview'] + +.. code-block:: + + {'num_posts': 2000, + 'num_exclamation_marks': 563, + 'exclamation_marks_per_post': 0.2815, + 'unique_exclamation_marks': 2} + + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + exclamation_summary['top_exclamation_marks'] + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + exclamation_summary['exclamation_text'][:15] + + +Extract Emoji 😂😭🥺🤣❤️✨🙏😍 +------------------------------ + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + emoji_summary = adv.extract_emoji(tweets['tweet_text']) + emoji_summary.keys() + +.. code-block:: + + dict_keys(['emoji', 'emoji_text', 'emoji_flat', 'emoji_flat_text', + 'emoji_counts', 'emoji_freq', 'top_emoji', 'top_emoji_text', + 'top_emoji_groups', 'top_emoji_sub_groups', 'overview']) + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + emoji_summary['overview'] + +.. code-block:: + + {'num_posts': 2000, + 'num_emoji': 1149, + 'emoji_per_post': 0.5745, + 'unique_emoji': 279} + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + pd.DataFrame({ + 'emoji': emoji_summary['emoji'], + 'emoji_name': emoji_summary['emoji_text'] + })[:20] + + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + emoji_summary['top_emoji'][:20] + +.. 
code-block:: + + [('☕', 159), + ('😭', 72), + ('😂', 64), + ('🤣', 49), + ('🔥', 32), + ('⬛', 21), + ('🟩', 16), + ('🥰', 15), + ('😍', 15), + ('❤️', 14), + ('🍩', 14), + ('😋', 13), + ('🥺', 13), + ('🤔', 13), + ('🥲', 13), + ('🙏', 12), + ('😅', 11), + ('💖', 11), + ('💜', 11), + ('😊', 10)] + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + emoji_summary['top_emoji_text'][:20] + + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + emoji_summary['top_emoji_groups'] + +.. code-block:: + + [('Smileys & Emotion', 601), + ('Food & Drink', 210), + ('People & Body', 97), + ('Symbols', 75), + ('Travel & Places', 67), + ('Animals & Nature', 33), + ('Objects', 29), + ('Activities', 26), + ('Flags', 11)] + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + emoji_summary['top_emoji_sub_groups'] + """ __all__ = ['extract', 'extract_currency', 'extract_exclamations', 'extract_hashtags', @@ -74,12 +612,13 @@ ] import re -from unicodedata import name from collections import Counter +from unicodedata import name from urllib.parse import urlparse + # from .emoji import EMOJI, EMOJI_ENTRIES -from .regex import (MENTION, HASHTAG, CURRENCY, CURRENCY_RAW, EXCLAMATION, - EXCLAMATION_MARK, QUESTION, QUESTION_MARK, URL) +from .regex import (CURRENCY, CURRENCY_RAW, EXCLAMATION, EXCLAMATION_MARK, + HASHTAG, MENTION, QUESTION, QUESTION_MARK, URL) def extract(text_list, regex, key_name, extracted=None, **kwargs): diff --git a/advertools/logs.py b/advertools/logs.py index 887af046..d3e9608a 100644 --- a/advertools/logs.py +++ b/advertools/logs.py @@ -236,7 +236,7 @@ ==== ======================================== ================ ================ ================== =============== ================== ================== ============== =============== =============== =============== ================== 0 \- \- nan nan \- nan nan \- 1 \- \- nan nan \- nan nan \- - 2 http://adver.tools/ http adver.tools / nan 
nan nan nan nan nan + 2 http://adver.tools/ http adver.tools / nan nan nan nan nan nan 3 \- \- nan nan \- nan nan \- 4 \- \- nan nan \- nan nan \- 5 \- \- nan nan \- nan nan \- @@ -245,6 +245,7 @@ 8 http://www.adver.tools/staging/urlytics/ http www.adver.tools /staging/urlytics/ nan nan staging urlytics nan urlytics 9 http://www.adver.tools/staging/urlytics/ http www.adver.tools /staging/urlytics/ nan nan staging urlytics nan urlytics ==== ======================================== ================ ================ ================== =============== ================== ================== ============== =============== =============== =============== ================== + Parse the ``user_agent`` column. .. thebe-button:: diff --git a/advertools/urlytics.py b/advertools/urlytics.py index c32d675f..c3bab781 100644 --- a/advertools/urlytics.py +++ b/advertools/urlytics.py @@ -27,11 +27,20 @@ The main function here is :func:`url_to_df`, which as the name suggests, converts URLs to DataFrames. ->>> urls = ['https://netloc.com/path_1/path_2?price=10&color=blue#frag_1', -... 'https://netloc.com/path_1/path_2?price=15&color=red#frag_2', -... 'https://netloc.com/path_1/path_2/path_3?size=sm&color=blue#frag_1', -... 'https://netloc.com/path_1?price=10&color=blue'] ->>> url_to_df(urls) + +.. thebe-button:: + Run this code + +.. code-block:: + :class: thebe, thebe-init + + import advertools as adv + + urls = ['https://netloc.com/path_1/path_2?price=10&color=blue#frag_1', + 'https://netloc.com/path_1/path_2?price=15&color=red#frag_2', + 'https://netloc.com/path_1/path_2/path_3?size=sm&color=blue#frag_1', + 'https://netloc.com/path_1?price=10&color=blue'] + adv.url_to_df(urls) ==== ================================================================= ======== ========== ===================== =================== ========== ======= ======= ======= ========== ============= ============= ============ .. 
url scheme netloc path query fragment dir_1 dir_2 dir_3 last_dir query_color query_price query_size @@ -42,6 +51,9 @@ 3 https://netloc.com/path_1?price=10&color=blue https netloc.com /path_1 price=10&color=blue path_1 nan nan path_1 blue 10 nan ==== ================================================================= ======== ========== ===================== =================== ========== ======= ======= ======= ========== ============= ============= ============ +A more elaborate example on :ref:`how to analyze URLs ` shows how you +might use this function after obtaining a set of URLs. + * **url**: The original URLs are listed as a reference. They are decoded for easier reading, and you can set ``decode=False`` if you want to retain the original encoding. diff --git a/docs/_build/doctrees/advertools.extract.doctree b/docs/_build/doctrees/advertools.extract.doctree index 97769673..b6949128 100644 Binary files a/docs/_build/doctrees/advertools.extract.doctree and b/docs/_build/doctrees/advertools.extract.doctree differ diff --git a/docs/_build/doctrees/advertools.logs.doctree b/docs/_build/doctrees/advertools.logs.doctree index 527b53af..205613d5 100644 Binary files a/docs/_build/doctrees/advertools.logs.doctree and b/docs/_build/doctrees/advertools.logs.doctree differ diff --git a/docs/_build/doctrees/advertools.urlytics.doctree b/docs/_build/doctrees/advertools.urlytics.doctree index 266f99cc..1ccfecd8 100644 Binary files a/docs/_build/doctrees/advertools.urlytics.doctree and b/docs/_build/doctrees/advertools.urlytics.doctree differ diff --git a/docs/_build/doctrees/environment.pickle b/docs/_build/doctrees/environment.pickle index 8d2a01f6..a104b3e5 100644 Binary files a/docs/_build/doctrees/environment.pickle and b/docs/_build/doctrees/environment.pickle differ diff --git a/docs/_build/html/.buildinfo b/docs/_build/html/.buildinfo index df5ee486..225bb0c1 100644 --- a/docs/_build/html/.buildinfo +++ b/docs/_build/html/.buildinfo @@ -1,4 +1,4 @@ # Sphinx build 
info version 1 # This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done. -config: dcffe16a241ebe10751e1c816c8a1e5a +config: ac9e0f7445c29a29d6ca26f0baa57518 tags: 645f666f9bcd5a90fca523b33c5a78b7 diff --git a/docs/_build/html/_modules/advertools/ad_create.html b/docs/_build/html/_modules/advertools/ad_create.html index fadf47be..0036048a 100644 --- a/docs/_build/html/_modules/advertools/ad_create.html +++ b/docs/_build/html/_modules/advertools/ad_create.html @@ -233,7 +233,7 @@

Source code for advertools.ad_create

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/ad_from_string.html b/docs/_build/html/_modules/advertools/ad_from_string.html index 9b6fd85a..fec5551e 100644 --- a/docs/_build/html/_modules/advertools/ad_from_string.html +++ b/docs/_build/html/_modules/advertools/ad_from_string.html @@ -337,7 +337,7 @@

Source code for advertools.ad_from_string

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/emoji.html b/docs/_build/html/_modules/advertools/emoji.html index 43e366cb..f5f31fba 100644 --- a/docs/_build/html/_modules/advertools/emoji.html +++ b/docs/_build/html/_modules/advertools/emoji.html @@ -4960,7 +4960,7 @@

Source code for advertools.emoji

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/extract.html b/docs/_build/html/_modules/advertools/extract.html index 9e25df7a..915682e4 100644 --- a/docs/_build/html/_modules/advertools/extract.html +++ b/docs/_build/html/_modules/advertools/extract.html @@ -152,16 +152,34 @@

Source code for advertools.extract

 
 The recommended way of using:
 
->>> import advertools as adv
->>> text_list = ['This is the first #text.', 'Second #sentence is here.',
-... 'Hello, how are you?', 'This #sentence is the last #sentence']
->>> hashtag_summary = adv.extract_hashtags(text_list)
->>> hashtag_summary.keys()
-dict_keys(['hashtags', 'hashtags_flat', 'hashtag_counts', 'hashtag_freq',
-           'top_hashtags', 'overview'])
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    import advertools as adv
+
+    text_list = ['This is the first #text.', 'Second #sentence is here.',
+                 'Hello, how are you?', 'This #sentence is the last #sentence']
+    hashtag_summary = adv.extract_hashtags(text_list)
+    hashtag_summary.keys()
+
+.. code-block::
+
+    dict_keys(['hashtags', 'hashtags_flat', 'hashtag_counts', 'hashtag_freq',
+               'top_hashtags', 'overview'])
 
 Now you can start exploring:
 
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    hashtag_summary
+
 >>> hashtag_summary['overview']
 {'num_posts': 4,
  'num_hashtags': 4,
@@ -179,6 +197,526 @@ 

Source code for advertools.extract

 >>> hashtag_summary['top_hashtags']
 [('#sentence', 3), ('#text', 1)]
 
+Let's explore a proper dataset of tweets, which you can generate using one of
+the functions in the :ref:`twitter API <twitter>` module.
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    import advertools as adv
+    import pandas as pd
+
+    tweets = pd.read_csv('data/tweets.csv')
+    print(tweets.shape)
+    tweets.head()
+
+====  ================================================================================================================================================  =================
+  ..  tweet_text                                                                                                                                          followers_count
+====  ================================================================================================================================================  =================
+   0  @AERIALMAGZC @penguinnyyyyy you won't be afraid if I give you a real reason :D                                                                                  157
+   1  Vibing in the office to #Metallica when the boss is on a coffee break                                                                                          4687
+      #TheOffice https://t.co/U5vdYevvfe
+   2  I feel like Ann says she likes coffee and then gets drinks that are 99% sugar and 1% coffee https://t.co/HfuBV4v3aY                                             104
+   3  A venti iced coffee with four pumps of white mocha, sweet cream and caramel drizzle might just be my new favorite drink. Shout out to TikTok lol                126
+   4  I was never a coffee person until I had kids. ☕️ this cup is a life saver. https://t.co/Zo0CnVuiGj                                                             1595
+   5  Who's excited about our next Coffee Chat? We know we are!🥳                                                                                                    5004
+
+      We're also adding Representative John Bradford to this lineup to discuss redistricting in the area. You won't want to miss it!
+
+      RSVP: https://t.co/R3YNJjJCUG
+      Join the meeting: https://t.co/Ho4Kx7ZZ24 https://t.co/KfPdR3hupY
+   6  he paid for my coffee= husband💗                                                                                                                                165
+   7  It's nipply outside, and now I side too :)                                                                                                                        0
+      That sounds like blowjob in front of a fire and visit with coffee after :)
+      I'm still out of coffee
+      I could have green tea instead
+      Hahahahahahaha
+      I want to spend the morning pampering you ...
+   8  Good morning 😃🌞☀️ I hope everyone has a great Tuesday morning. Enjoy your day and coffee ☕️ ♥️❤️💕🥰😘                                                           189
+   9  @MarvinMilton2 I nearly choked on my coffee 🤪                                                                                                                 1160
+====  ================================================================================================================================================  =================
+
+Extract `#hashtags`
+-------------------
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    hashtag_summary = adv.extract_hashtags(tweets['tweet_text'])
+    hashtag_summary.keys()
+
+.. code-block::
+
+    dict_keys(['hashtags', 'hashtags_flat', 'hashtag_counts', 'hashtag_freq',
+               'top_hashtags', 'overview'])
+
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    hashtag_summary['overview']
+
+.. code-block::
+
+    {'num_posts': 2000,
+     'num_hashtags': 733,
+     'hashtags_per_post': 0.3665,
+     'unique_hashtags': 572}
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    [h for h in hashtag_summary['hashtags'] if h][:10]
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    hashtag_summary['top_hashtags'][:10]
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    hashtag_summary['hashtag_freq']
+
+
+Extract `@mentions`
+-------------------
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    mention_summary = adv.extract_mentions(tweets['tweet_text'])
+    mention_summary.keys()
+
+.. code-block::
+
+    dict_keys(['mentions', 'mentions_flat', 'mention_counts', 'mention_freq',
+               'top_mentions', 'overview'])
+
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    mention_summary['overview']
+
+.. code-block::
+
+    {'num_posts': 2000,
+     'num_mentions': 1346,
+     'mentions_per_post': 0.673,
+     'unique_mentions': 1132}
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    pd.DataFrame(zip(mention_summary['mentions'],
+                    mention_summary['mention_counts']),
+                 columns=['mentions', 'count'])
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    [h for h in mention_summary['mentions'] if h][:10]
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    mention_summary['top_mentions'][:10]
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    mention_summary['mention_freq']
+
+.. thebe-button::
+    Run this code
+
+
+Extract Currency  `$ ¢ £ ¤ ¥ ֏ ؋ ₲ ₵ ₸ ₹﹩ ¢ £ ¥ ₩ ₺ ₻ ₼ ₽ ₾ ₿ ﷼`
+---------------------------------------------------------------------
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    currency_summary = adv.extract_currency(tweets['tweet_text'])
+    currency_summary.keys()
+
+.. code-block::
+
+    dict_keys(['currency_symbols', 'currency_symbols_flat',
+               'currency_symbol_counts', 'currency_symbol_freq',
+               'top_currency_symbols', 'overview', 'currency_symbol_names',
+               'surrounding_text'])
+
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    currency_summary['overview']
+
+.. code-block::
+
+    {'num_posts': 2000,
+     'num_currency_symbols': 37,
+     'currency_symbols_per_post': 0.0185,
+     'unique_currency_symbols': 4}
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    currency_summary['top_currency_symbols']
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    [text for text in currency_summary['surrounding_text'] if text][:10]
+
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    [sym for sym in currency_summary['currency_symbol_names'] if sym][:10]
+
+
+Extract numbers `1234567890٠١٢٣٤٥٦٧٨٩㊺𑁛𐄍𐢪⓲𑁣𐄨𐤛`
+--------------------------------------------------
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    number_summary = adv.extract_numbers(tweets['tweet_text'])
+    number_summary.keys()
+
+.. code-block::
+
+    dict_keys(['numbers', 'numbers_flat', 'number_counts', 'number_freq',
+               'top_numbers', 'overview'])
+
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    number_summary['overview']
+
+.. code-block::
+
+    {'num_posts': 2000,
+     'num_numbers': 1727,
+     'numbers_per_post': 0.8635,
+     'unique_numbers': 257}
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    number_summary['number_freq']
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    pd.DataFrame({
+        'numbers': number_summary['numbers'],
+        'counts': number_summary['number_counts'],
+    }).head(20)
+
+
+Extract questions `? ¿ ; ՞ ؟ ፧ ᥅ ⁇ ⁈ ⁉ ⳺ ⳻ ⸮ ꘏ ꛷ ︖ ﹖ ? 𑅃 𞥟 ʔ ‽`
+------------------------------------------------------------------
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    question_summary = adv.extract_questions(tweets['tweet_text'])
+    question_summary.keys()
+
+.. code-block::
+
+    dict_keys(['question_marks', 'question_marks_flat', 'question_mark_counts',
+               'question_mark_freq', 'top_question_marks', 'overview',
+               'question_mark_names', 'question_text'])
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    question_summary['overview']
+
+.. code-block::
+
+    {'num_posts': 2000,
+     'num_question_marks': 321,
+     'question_marks_per_post': 0.1605,
+     'unique_question_marks': 1}
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    question_summary['question_text'][:25]
+
+.. code-block::
+
+    [[],
+     [],
+     [],
+     [],
+     [],
+     ["Who's excited about our next Coffee Chat?"],
+     [],
+     [],
+     [],
+     [],
+     ['@ckaiserjr @perry_ron @LILGUYISBACK Is it okay if the hot water is flavored with coffee?'],
+     [],
+     [],
+     [],
+     [],
+     [],
+     [],
+     [],
+     [],
+     [],
+     ["You think if you do that you'll loose your followers ???"],
+     [],
+     [],
+     ['maybe more coffee will help?'],
+     []]
+
+
+Extract Exclamations `! ¡ ՜ ߹ ᥄ ‼ ⁈ ⁉ ︕ ﹗ ! 𞥞`
+-------------------------------------------------
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    exclamation_summary = adv.extract_exclamations(tweets['tweet_text'])
+    exclamation_summary.keys()
+
+.. code-block::
+
+    dict_keys(['exclamation_marks', 'exclamation_marks_flat',
+               'exclamation_mark_counts', 'exclamation_mark_freq',
+               'top_exclamation_marks', 'overview', 'exclamation_mark_names',
+               'exclamation_text'])
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    exclamation_summary['overview']
+
+.. code-block::
+
+    {'num_posts': 2000,
+     'num_exclamation_marks': 563,
+     'exclamation_marks_per_post': 0.2815,
+     'unique_exclamation_marks': 2}
+
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    exclamation_summary['top_exclamation_marks']
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    exclamation_summary['exclamation_text'][:15]
+
+
+Extract Emoji 😂😭🥺🤣❤️✨🙏😍
+------------------------------
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    emoji_summary = adv.extract_emoji(tweets['tweet_text'])
+    emoji_summary.keys()
+
+.. code-block::
+
+    dict_keys(['emoji', 'emoji_text', 'emoji_flat', 'emoji_flat_text',
+               'emoji_counts', 'emoji_freq', 'top_emoji', 'top_emoji_text',
+               'top_emoji_groups', 'top_emoji_sub_groups', 'overview'])
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    emoji_summary['overview']
+
+.. code-block::
+
+    {'num_posts': 2000,
+     'num_emoji': 1149,
+     'emoji_per_post': 0.5745,
+     'unique_emoji': 279}
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    pd.DataFrame({
+        'emoji': emoji_summary['emoji'],
+        'emoji_name': emoji_summary['emoji_text']
+    })[:20]
+
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    emoji_summary['top_emoji'][:20]
+
+.. code-block::
+
+    [('☕', 159),
+     ('😭', 72),
+     ('😂', 64),
+     ('🤣', 49),
+     ('🔥', 32),
+     ('⬛', 21),
+     ('🟩', 16),
+     ('🥰', 15),
+     ('😍', 15),
+     ('❤️', 14),
+     ('🍩', 14),
+     ('😋', 13),
+     ('🥺', 13),
+     ('🤔', 13),
+     ('🥲', 13),
+     ('🙏', 12),
+     ('😅', 11),
+     ('💖', 11),
+     ('💜', 11),
+     ('😊', 10)]
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    emoji_summary['top_emoji_text'][:20]
+
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    emoji_summary['top_emoji_groups']
+
+.. code-block::
+
+    [('Smileys & Emotion', 601),
+    ('Food & Drink', 210),
+    ('People & Body', 97),
+    ('Symbols', 75),
+    ('Travel & Places', 67),
+    ('Animals & Nature', 33),
+    ('Objects', 29),
+    ('Activities', 26),
+    ('Flags', 11)]
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    emoji_summary['top_emoji_sub_groups']
+
 """
 __all__ = ['extract', 'extract_currency',
            'extract_exclamations', 'extract_hashtags',
@@ -187,12 +725,13 @@ 

Source code for advertools.extract

            ]
 
 import re
-from unicodedata import name
 from collections import Counter
+from unicodedata import name
 from urllib.parse import urlparse
+
 # from .emoji import EMOJI, EMOJI_ENTRIES
-from .regex import (MENTION, HASHTAG, CURRENCY, CURRENCY_RAW, EXCLAMATION,
-                    EXCLAMATION_MARK, QUESTION, QUESTION_MARK, URL)
+from .regex import (CURRENCY, CURRENCY_RAW, EXCLAMATION, EXCLAMATION_MARK,
+                    HASHTAG, MENTION, QUESTION, QUESTION_MARK, URL)
 
 
 
[docs]def extract(text_list, regex, key_name, extracted=None, **kwargs): @@ -904,7 +1443,7 @@

Source code for advertools.extract

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/header_spider.html b/docs/_build/html/_modules/advertools/header_spider.html index d40ebd08..adf47322 100644 --- a/docs/_build/html/_modules/advertools/header_spider.html +++ b/docs/_build/html/_modules/advertools/header_spider.html @@ -333,7 +333,7 @@

Source code for advertools.header_spider

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/knowledge_graph.html b/docs/_build/html/_modules/advertools/knowledge_graph.html index 29b273cf..db5c6f3e 100644 --- a/docs/_build/html/_modules/advertools/knowledge_graph.html +++ b/docs/_build/html/_modules/advertools/knowledge_graph.html @@ -326,7 +326,7 @@

Source code for advertools.knowledge_graph

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/kw_generate.html b/docs/_build/html/_modules/advertools/kw_generate.html index c43c71e6..f68562ec 100644 --- a/docs/_build/html/_modules/advertools/kw_generate.html +++ b/docs/_build/html/_modules/advertools/kw_generate.html @@ -402,7 +402,7 @@

Source code for advertools.kw_generate

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/logs.html b/docs/_build/html/_modules/advertools/logs.html index 62ed2d24..7cef3239 100644 --- a/docs/_build/html/_modules/advertools/logs.html +++ b/docs/_build/html/_modules/advertools/logs.html @@ -349,7 +349,7 @@

Source code for advertools.logs

 ====  ========================================  ================  ================  ==================  ===============  ==================  ==================  ==============  ===============  ===============  ===============  ==================
    0  \-                                                                            \-                                                                      nan             nan  \-               nan                          nan  \-
    1  \-                                                                            \-                                                                      nan             nan  \-               nan                          nan  \-
-   2  http://adver.tools/                      http              adver.tools        /                                                                       nan             nan  nan              nan                          nan  nan
+   2  http://adver.tools/                       http              adver.tools       /                                                                       nan             nan  nan              nan                          nan  nan
    3  \-                                                                            \-                                                                      nan             nan  \-               nan                          nan  \-
    4  \-                                                                            \-                                                                      nan             nan  \-               nan                          nan  \-
    5  \-                                                                            \-                                                                      nan             nan  \-               nan                          nan  \-
@@ -358,6 +358,7 @@ 

Source code for advertools.logs

    8  http://www.adver.tools/staging/urlytics/  http              www.adver.tools   /staging/urlytics/                                                      nan             nan  staging          urlytics                     nan  urlytics
    9  http://www.adver.tools/staging/urlytics/  http              www.adver.tools   /staging/urlytics/                                                      nan             nan  staging          urlytics                     nan  urlytics
 ====  ========================================  ================  ================  ==================  ===============  ==================  ==================  ==============  ===============  ===============  ===============  ==================
+
 Parse the ``user_agent`` column.
 
 .. thebe-button::
@@ -720,7 +721,7 @@ 

Source code for advertools.logs

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/reverse_dns_lookup.html b/docs/_build/html/_modules/advertools/reverse_dns_lookup.html index f02bc5a3..1bfe04b4 100644 --- a/docs/_build/html/_modules/advertools/reverse_dns_lookup.html +++ b/docs/_build/html/_modules/advertools/reverse_dns_lookup.html @@ -266,7 +266,7 @@

Source code for advertools.reverse_dns_lookup

-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/robotstxt.html b/docs/_build/html/_modules/advertools/robotstxt.html index 242a04bf..ce976785 100644 --- a/docs/_build/html/_modules/advertools/robotstxt.html +++ b/docs/_build/html/_modules/advertools/robotstxt.html @@ -614,7 +614,7 @@

Source code for advertools.robotstxt

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/serp.html b/docs/_build/html/_modules/advertools/serp.html index fa597b74..f0738282 100644 --- a/docs/_build/html/_modules/advertools/serp.html +++ b/docs/_build/html/_modules/advertools/serp.html @@ -1363,7 +1363,7 @@

Source code for advertools.serp

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/sitemaps.html b/docs/_build/html/_modules/advertools/sitemaps.html index 11c611e2..23a91c7c 100644 --- a/docs/_build/html/_modules/advertools/sitemaps.html +++ b/docs/_build/html/_modules/advertools/sitemaps.html @@ -679,7 +679,7 @@

Source code for advertools.sitemaps

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/spider.html b/docs/_build/html/_modules/advertools/spider.html index b3d57533..b5a12abb 100644 --- a/docs/_build/html/_modules/advertools/spider.html +++ b/docs/_build/html/_modules/advertools/spider.html @@ -1091,7 +1091,7 @@

Source code for advertools.spider

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/twitter.html b/docs/_build/html/_modules/advertools/twitter.html index 75f6c3a2..720071a3 100644 --- a/docs/_build/html/_modules/advertools/twitter.html +++ b/docs/_build/html/_modules/advertools/twitter.html @@ -1331,7 +1331,7 @@

Source code for advertools.twitter

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/url_builders.html b/docs/_build/html/_modules/advertools/url_builders.html index db8d8b5e..49e5362c 100644 --- a/docs/_build/html/_modules/advertools/url_builders.html +++ b/docs/_build/html/_modules/advertools/url_builders.html @@ -155,7 +155,7 @@

Source code for advertools.url_builders

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/urlytics.html b/docs/_build/html/_modules/advertools/urlytics.html index 398fedae..a8877b24 100644 --- a/docs/_build/html/_modules/advertools/urlytics.html +++ b/docs/_build/html/_modules/advertools/urlytics.html @@ -140,11 +140,20 @@

Source code for advertools.urlytics

 The main function here is :func:`url_to_df`, which as the name suggests,
 converts URLs to DataFrames.
 
->>> urls = ['https://netloc.com/path_1/path_2?price=10&color=blue#frag_1',
-...         'https://netloc.com/path_1/path_2?price=15&color=red#frag_2',
-...         'https://netloc.com/path_1/path_2/path_3?size=sm&color=blue#frag_1',
-...         'https://netloc.com/path_1?price=10&color=blue']
->>> url_to_df(urls)
+
+.. thebe-button::
+    Run this code
+
+.. code-block::
+    :class: thebe, thebe-init
+
+    import advertools as adv
+
+    urls = ['https://netloc.com/path_1/path_2?price=10&color=blue#frag_1',
+            'https://netloc.com/path_1/path_2?price=15&color=red#frag_2',
+            'https://netloc.com/path_1/path_2/path_3?size=sm&color=blue#frag_1',
+            'https://netloc.com/path_1?price=10&color=blue']
+    adv.url_to_df(urls)
 
 ====  =================================================================  ========  ==========  =====================  ===================  ==========  =======  =======  =======  ==========  =============  =============  ============
   ..  url                                                                scheme    netloc      path                   query                fragment    dir_1    dir_2    dir_3    last_dir    query_color      query_price  query_size
@@ -155,6 +164,9 @@ 

Source code for advertools.urlytics

    3  https://netloc.com/path_1?price=10&color=blue                      https     netloc.com  /path_1                price=10&color=blue              path_1   nan      nan      path_1      blue                      10  nan
 ====  =================================================================  ========  ==========  =====================  ===================  ==========  =======  =======  =======  ==========  =============  =============  ============
 
+A more elaborate example on :ref:`how to analyze URLs <sitemaps>` shows how you
+might use this function after obtaining a set of URLs.
+
 * **url**: The original URLs are listed as a reference. They are decoded for
   easier reading, and you can set ``decode=False`` if you want to retain the
   original encoding.
@@ -311,7 +323,7 @@ 

Source code for advertools.urlytics

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/word_frequency.html b/docs/_build/html/_modules/advertools/word_frequency.html index 507aa36e..8f3c32cc 100644 --- a/docs/_build/html/_modules/advertools/word_frequency.html +++ b/docs/_build/html/_modules/advertools/word_frequency.html @@ -375,7 +375,7 @@

Source code for advertools.word_frequency

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/word_tokenize.html b/docs/_build/html/_modules/advertools/word_tokenize.html index a59f95f6..22d5e99f 100644 --- a/docs/_build/html/_modules/advertools/word_tokenize.html +++ b/docs/_build/html/_modules/advertools/word_tokenize.html @@ -190,7 +190,7 @@

Source code for advertools.word_tokenize

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/advertools/youtube.html b/docs/_build/html/_modules/advertools/youtube.html index d449d88a..36fb45d8 100644 --- a/docs/_build/html/_modules/advertools/youtube.html +++ b/docs/_build/html/_modules/advertools/youtube.html @@ -1281,7 +1281,7 @@

Source code for advertools.youtube

   
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_modules/index.html b/docs/_build/html/_modules/index.html index 733ac17c..85a3aea4 100644 --- a/docs/_build/html/_modules/index.html +++ b/docs/_build/html/_modules/index.html @@ -138,7 +138,7 @@

All modules for which code is available


-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/_sources/advertools.logs.rst.txt b/docs/_build/html/_sources/advertools.logs.rst.txt index b5cc037e..614d34dd 100644 --- a/docs/_build/html/_sources/advertools.logs.rst.txt +++ b/docs/_build/html/_sources/advertools.logs.rst.txt @@ -1,3 +1,4 @@ + .. automodule:: advertools.logs :members: :undoc-members: diff --git a/docs/_build/html/advertools.ad_create.html b/docs/_build/html/advertools.ad_create.html index 4b690bda..409d198d 100644 --- a/docs/_build/html/advertools.ad_create.html +++ b/docs/_build/html/advertools.ad_create.html @@ -240,7 +240,7 @@
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/advertools.ad_from_string.html b/docs/_build/html/advertools.ad_from_string.html index d29cf1b1..dd819f9e 100644 --- a/docs/_build/html/advertools.ad_from_string.html +++ b/docs/_build/html/advertools.ad_from_string.html @@ -299,7 +299,7 @@

Facebook Instant Article Ad -

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/advertools.code_recipes.html b/docs/_build/html/advertools.code_recipes.html index 0c55ce76..2ef58803 100644 --- a/docs/_build/html/advertools.code_recipes.html +++ b/docs/_build/html/advertools.code_recipes.html @@ -174,7 +174,7 @@

Submodules -

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/advertools.code_recipes.spider_strategies.html b/docs/_build/html/advertools.code_recipes.spider_strategies.html index 791918b0..a66a172e 100644 --- a/docs/_build/html/advertools.code_recipes.spider_strategies.html +++ b/docs/_build/html/advertools.code_recipes.spider_strategies.html @@ -639,7 +639,7 @@

XPath expressions for custom extraction -

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with Sphinx using a diff --git a/docs/_build/html/advertools.emoji.html b/docs/_build/html/advertools.emoji.html index fd465b18..1640a019 100644 --- a/docs/_build/html/advertools.emoji.html +++ b/docs/_build/html/advertools.emoji.html @@ -509,7 +509,7 @@

Extract Emoji from Text
-

© Copyright 2021, Elias Dabbas.

+

© Copyright 2022, Elias Dabbas.

Built with
Sphinx using a diff --git a/docs/_build/html/advertools.extract.html b/docs/_build/html/advertools.extract.html index 5fb3dad8..263a62b0 100644 --- a/docs/_build/html/advertools.extract.html +++ b/docs/_build/html/advertools.extract.html @@ -77,6 +77,13 @@
  • Emoji Tools
  • Extract Structured Entities from Text
  • Stop Words
  • @@ -175,16 +182,22 @@

    Extract Functions
    >>> import advertools as adv
    ->>> text_list = ['This is the first #text.', 'Second #sentence is here.',
    -... 'Hello, how are you?', 'This #sentence is the last #sentence']
    ->>> hashtag_summary = adv.extract_hashtags(text_list)
    ->>> hashtag_summary.keys()
    -dict_keys(['hashtags', 'hashtags_flat', 'hashtag_counts', 'hashtag_freq',
    -           'top_hashtags', 'overview'])
    +
    import advertools as adv
    +
    +text_list = ['This is the first #text.', 'Second #sentence is here.',
    +             'Hello, how are you?', 'This #sentence is the last #sentence']
    +hashtag_summary = adv.extract_hashtags(text_list)
    +hashtag_summary.keys()
    +
    +
    +
    dict_keys(['hashtags', 'hashtags_flat', 'hashtag_counts', 'hashtag_freq',
    +           'top_hashtags', 'overview'])
     

    Now you can start exploring:

    +
    hashtag_summary
    +
    +
    +

    Let's explore a proper dataset of tweets, which you can generate using one of +the functions in the twitter API module.

    +
    import advertools as adv
    +import pandas as pd
    +
    +tweets = pd.read_csv('data/tweets.csv')
    +print(tweets.shape)
    +tweets.head()
    +
    +
    + +++++ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +

    tweet_text

    followers_count

    0

    @AERIALMAGZC @penguinnyyyyy you won't be afraid if I give you a real reason :D

    157

    1

    Vibing in the office to #Metallica when the boss is on a coffee break +#TheOffice https://t.co/U5vdYevvfe

    4687

    2

    I feel like Ann says she likes coffee and then gets drinks that are 99% sugar and 1% coffee https://t.co/HfuBV4v3aY

    104

    3

    A venti iced coffee with four pumps of white mocha, sweet cream and caramel drizzle might just be my new favorite drink. Shout out to TikTok lol

    126

    4

    I was never a coffee person until I had kids. ☕️ this cup is a life saver. https://t.co/Zo0CnVuiGj

    1595

    5

    Who's excited about our next Coffee Chat? We know we are!🥳

    +

    We're also adding Representative John Bradford to this lineup to discuss redistricting in the area. You won't want to miss it!

    +

    RSVP: https://t.co/R3YNJjJCUG +Join the meeting: https://t.co/Ho4Kx7ZZ24 https://t.co/KfPdR3hupY

    +

    5004

    6

    he paid for my coffee= husband💗

    165

    7

    It's nipply outside, and now I side too :) +That sounds like blowjob in front of a fire and visit with coffee after :) +I'm still out of coffee +I could have green tea instead +Hahahahahahaha +I want to spend the morning pampering you ...

    0

    8

    Good morning 😃🌞☀️ I hope everyone has a great Tuesday morning. Enjoy your day and coffee ☕️ ♥️❤️💕🥰😘

    189

    9

    @MarvinMilton2 I nearly choked on my coffee 🤪

    1160

    + +
    +

    Extract #hashtags

    +
    hashtag_summary = adv.extract_hashtags(tweets['tweet_text'])
    +hashtag_summary.keys()
    +
    +
    +
    dict_keys(['hashtags', 'hashtags_flat', 'hashtag_counts', 'hashtag_freq',
    +        'top_hashtags', 'overview'])
    +
    +
    +
    hashtag_summary['overview']
    +
    +
    +
    {'num_posts': 2000,
    +'num_hashtags': 733,
    +'hashtags_per_post': 0.3665,
    +'unique_hashtags': 572}
    +
    +
    +
    [h for h in hashtag_summary['hashtags'] if h][:10]
    +
    +
    +
    hashtag_summary['top_hashtags'][:10]
    +
    +
    +
    hashtag_summary['hashtag_freq']
    +
    +
    +
    +
    +

    Extract @mentions

    +
    mention_summary = adv.extract_mentions(tweets['tweet_text'])
    +mention_summary.keys()
    +
    +
    +
    dict_keys(['mentions', 'mentions_flat', 'mention_counts', 'mention_freq',
    +           'top_mentions', 'overview'])
    +
    +
    +
    mention_summary['overview']
    +
    +
    +
    {'num_posts': 2000,
    +'num_mentions': 1346,
    +'mentions_per_post': 0.673,
    +'unique_mentions': 1132}
    +
    +
    +
    pd.DataFrame(zip(mention_summary['mentions'],
    +                mention_summary['mention_counts']),
    +             columns=['mentions', 'count'])
    +
    +
    +
    [h for h in mention_summary['mentions'] if h][:10]
    +
    +
    +
    mention_summary['top_mentions'][:10]
    +
    +
    +
    mention_summary['mention_freq']
    +
    +
    +
    +
    +

    Extract Currency $ ¢ £ ¤ ¥ ֏ ؋ ₲ ₵ ₸ ₹﹩ ¢ £ ¥ ₩ ₺ ₻ ₼ ₽ ₾ ₿ ﷼

    +
    currency_summary = adv.extract_currency(tweets['tweet_text'])
    +currency_summary.keys()
    +
    +
    +
    dict_keys(['currency_symbols', 'currency_symbols_flat',
    +           'currency_symbol_counts', 'currency_symbol_freq',
    +           'top_currency_symbols', 'overview', 'currency_symbol_names',
    +           'surrounding_text'])
    +
    +
    +
    currency_summary['overview']
    +
    +
    +
    {'num_posts': 2000,
    +'num_currency_symbols': 37,
    +'currency_symbols_per_post': 0.0185,
    +'unique_currency_symbols': 4}
    +
    +
    +
    currency_summary['top_currency_symbols']
    +
    +
    +
    [text for text in currency_summary['surrounding_text'] if text][:10]
    +
    +
    +
    [sym for sym in currency_summary['currency_symbol_names'] if sym][:10]
    +
    +
    +
    +
    +

    Extract numbers 1234567890٠١٢٣٤٥٦٧٨٩㊺𑁛𐄍𐢪⓲𑁣𐄨𐤛

    +
    number_summary = adv.extract_numbers(tweets['tweet_text'])
    +number_summary.keys()
    +
    +
    +
    dict_keys(['numbers', 'numbers_flat', 'number_counts', 'number_freq',
    +           'top_numbers', 'overview'])
    +
    +
    +
    number_summary['overview']
    +
    +
    +
    {'num_posts': 2000,
    +'num_numbers': 1727,
    +'numbers_per_post': 0.8635,
    +'unique_numbers': 257}
    +
    +
    +
    number_summary['number_freq']
    +
    +
    +
    pd.DataFrame({
    +    'numbers': number_summary['numbers'],
    +    'counts': number_summary['number_counts'],
    +}).head(20)
    +
    +
    +
    +
    +

    Extract questions ? ¿ ; ՞ ؟ ፧ ᥅ ⁇ ⁈ ⁉ ⳺ ⳻ ⸮ ꘏ ꛷ ︖ ﹖ ? 𑅃 𞥟 ʔ ‽

    +
    question_summary = adv.extract_questions(tweets['tweet_text'])
    +question_summary.keys()
    +
    +
    +
    dict_keys(['question_marks', 'question_marks_flat', 'question_mark_counts',
    +           'question_mark_freq', 'top_question_marks', 'overview',
    +           'question_mark_names', 'question_text'])
    +
    +
    +
    question_summary['overview']
    +
    +
    +
    {'num_posts': 2000,
    +'num_question_marks': 321,
    +'question_marks_per_post': 0.1605,
    +'unique_question_marks': 1}
    +
    +
    +
    question_summary['question_text'][:25]
    +
    +
    +
    [[],
    + [],
    + [],
    + [],
    + [],
    + ["Who's excited about our next Coffee Chat?"],
    + [],
    + [],
    + [],
    + [],
    + ['@ckaiserjr @perry_ron @LILGUYISBACK Is it okay if the hot water is flavored with coffee?'],
    + [],
    + [],
    + [],
    + [],
    + [],
    + [],
    + [],
    + [],
    + [],
    + ["You think if you do that you'll loose your followers ???"],
    + [],
    + [],
    + ['maybe more coffee will help?'],
    + []]
    +
    +
    +
    +
    +

    Extract Exclamations ! ¡ ՜ ߹ ᥄ ‼ ⁈ ⁉ ︕ ﹗ ! 𞥞

    +
    exclamation_summary = adv.extract_exclamations(tweets['tweet_text'])
    +exclamation_summary.keys()
    +
    +
    +
    dict_keys(['exclamation_marks', 'exclamation_marks_flat',
    +           'exclamation_mark_counts', 'exclamation_mark_freq',
    +           'top_exclamation_marks', 'overview', 'exclamation_mark_names',
    +           'exclamation_text'])
    +
    +
    +
    exclamation_summary['overview']
    +
    +
    +
    {'num_posts': 2000,
    +'num_exclamation_marks': 563,
    +'exclamation_marks_per_post': 0.2815,
    +'unique_exclamation_marks': 2}
    +
    +
    +
    exclamation_summary['top_exclamation_marks']
    +
    +
    +
    exclamation_summary['exclamation_text'][:15]
    +
    +
    +
    +
    +

    Extract Emoji 😂😭🥺🤣❤️✨🙏😍

    +
    emoji_summary = adv.extract_emoji(tweets['tweet_text'])
    +emoji_summary.keys()
    +
    +
    +
    dict_keys(['emoji', 'emoji_text', 'emoji_flat', 'emoji_flat_text',
    +           'emoji_counts', 'emoji_freq', 'top_emoji', 'top_emoji_text',
    +           'top_emoji_groups', 'top_emoji_sub_groups', 'overview'])
    +
    +
    +
    emoji_summary['overview']
    +
    +
    +
    {'num_posts': 2000,
    +'num_emoji': 1149,
    +'emoji_per_post': 0.5745,
    +'unique_emoji': 279}
    +
    +
    +
    pd.DataFrame({
    +    'emoji': emoji_summary['emoji'],
    +    'emoji_name': emoji_summary['emoji_text']
    +})[:20]
    +
    +
    +
    emoji_summary['top_emoji'][:20]
    +
    +
    +
    [('☕', 159),
    + ('😭', 72),
    + ('😂', 64),
    + ('🤣', 49),
    + ('🔥', 32),
    + ('⬛', 21),
    + ('🟩', 16),
    + ('🥰', 15),
    + ('😍', 15),
    + ('❤️', 14),
    + ('🍩', 14),
    + ('😋', 13),
    + ('🥺', 13),
    + ('🤔', 13),
    + ('🥲', 13),
    + ('🙏', 12),
    + ('😅', 11),
    + ('💖', 11),
    + ('💜', 11),
    + ('😊', 10)]
    +
    +
    +
    emoji_summary['top_emoji_text'][:20]
    +
    +
    +
    emoji_summary['top_emoji_groups']
    +
    +
    +
    [('Smileys & Emotion', 601),
    +('Food & Drink', 210),
    +('People & Body', 97),
    +('Symbols', 75),
    +('Travel & Places', 67),
    +('Animals & Nature', 33),
    +('Objects', 29),
    +('Activities', 26),
    +('Flags', 11)]
    +
    +
    +
    emoji_summary['top_emoji_sub_groups']
    +
    +
    extract(text_list, regex, key_name, extracted=None, **kwargs)[source]
    @@ -940,7 +1302,7 @@

    Extract Functions -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.header_spider.html b/docs/_build/html/advertools.header_spider.html index 33697468..84cbde4e 100644 --- a/docs/_build/html/advertools.header_spider.html +++ b/docs/_build/html/advertools.header_spider.html @@ -576,7 +576,7 @@
    -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.html b/docs/_build/html/advertools.html index ba7f541f..34eccd3b 100644 --- a/docs/_build/html/advertools.html +++ b/docs/_build/html/advertools.html @@ -163,6 +163,13 @@

    SubmodulesExtract structured entities from text lists
  • 🕷 Python Status Code Checker with Response Headers
  • @@ -276,7 +283,7 @@

    Submodules -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.knowledge_graph.html b/docs/_build/html/advertools.knowledge_graph.html index 769cf29f..5444ba7b 100644 --- a/docs/_build/html/advertools.knowledge_graph.html +++ b/docs/_build/html/advertools.knowledge_graph.html @@ -296,7 +296,7 @@

    How to use Google's Knowledge Graph API -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.kw_generate.html b/docs/_build/html/advertools.kw_generate.html index 3a68b6ba..ad2a8753 100644 --- a/docs/_build/html/advertools.kw_generate.html +++ b/docs/_build/html/advertools.kw_generate.html @@ -420,7 +420,7 @@
    -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.logs.html b/docs/_build/html/advertools.logs.html index b4a60dd9..5d337cce 100644 --- a/docs/_build/html/advertools.logs.html +++ b/docs/_build/html/advertools.logs.html @@ -1736,6 +1736,181 @@

    Log File Analysis - Data Preparationreferer_url_df.head(10)

    + +++++++++++++++ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +

    referer_url

    referer_scheme

    referer_netloc

    referer_path

    referer_query

    referer_fragment

    referer_hostname

    referer_port

    referer_dir_1

    referer_dir_2

    referer_dir_3

    referer_last_dir

    0

    -

    -

    nan

    nan

    -

    nan

    nan

    -

    1

    -

    -

    nan

    nan

    -

    nan

    nan

    -

    2

    http://adver.tools/

    http

    adver.tools

    /

    nan

    nan

    nan

    nan

    nan

    nan

    3

    -

    -

    nan

    nan

    -

    nan

    nan

    -

    4

    -

    -

    nan

    nan

    -

    nan

    nan

    -

    5

    -

    -

    nan

    nan

    -

    nan

    nan

    -

    6

    -

    -

    nan

    nan

    -

    nan

    nan

    -

    7

    -

    -

    nan

    nan

    -

    nan

    nan

    -

    8

    http://www.adver.tools/staging/urlytics/

    http

    www.adver.tools

    /staging/urlytics/

    nan

    nan

    staging

    urlytics

    nan

    urlytics

    9

    http://www.adver.tools/staging/urlytics/

    http

    www.adver.tools

    /staging/urlytics/

    nan

    nan

    staging

    urlytics

    nan

    urlytics

    Parse the user_agent column.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.regex.html b/docs/_build/html/advertools.regex.html index 08db1581..d751e004 100644 --- a/docs/_build/html/advertools.regex.html +++ b/docs/_build/html/advertools.regex.html @@ -161,7 +161,7 @@
    -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.reverse_dns_lookup.html b/docs/_build/html/advertools.reverse_dns_lookup.html index 698f83e8..a0fc23a9 100644 --- a/docs/_build/html/advertools.reverse_dns_lookup.html +++ b/docs/_build/html/advertools.reverse_dns_lookup.html @@ -382,7 +382,7 @@
    -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.robotstxt.html b/docs/_build/html/advertools.robotstxt.html index 9aa274dc..0a3f43a5 100644 --- a/docs/_build/html/advertools.robotstxt.html +++ b/docs/_build/html/advertools.robotstxt.html @@ -955,7 +955,7 @@

    robots.txt Testing Approach -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.serp.html b/docs/_build/html/advertools.serp.html index b3b4e503..58860852 100644 --- a/docs/_build/html/advertools.serp.html +++ b/docs/_build/html/advertools.serp.html @@ -665,7 +665,7 @@
    -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.sitemaps.html b/docs/_build/html/advertools.sitemaps.html index 93839707..376cee2f 100644 --- a/docs/_build/html/advertools.sitemaps.html +++ b/docs/_build/html/advertools.sitemaps.html @@ -1182,7 +1182,7 @@

    Video Sitemaps -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.spider.html b/docs/_build/html/advertools.spider.html index 5f7dc38f..0488aa85 100644 --- a/docs/_build/html/advertools.spider.html +++ b/docs/_build/html/advertools.spider.html @@ -678,7 +678,7 @@

    Spider Custom Settings and Additional Functionality
    -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with
    Sphinx using a diff --git a/docs/_build/html/advertools.stopwords.html b/docs/_build/html/advertools.stopwords.html index 07ed8ca5..4899bb0e 100644 --- a/docs/_build/html/advertools.stopwords.html +++ b/docs/_build/html/advertools.stopwords.html @@ -228,7 +228,7 @@

    Stopword Languages -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.twitter.html b/docs/_build/html/advertools.twitter.html index 096b8995..4ae850d8 100644 --- a/docs/_build/html/advertools.twitter.html +++ b/docs/_build/html/advertools.twitter.html @@ -1083,7 +1083,7 @@

    Functions -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.url_builders.html b/docs/_build/html/advertools.url_builders.html index ec1cc297..9120d2a2 100644 --- a/docs/_build/html/advertools.url_builders.html +++ b/docs/_build/html/advertools.url_builders.html @@ -181,7 +181,7 @@
    -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.urlytics.html b/docs/_build/html/advertools.urlytics.html index ffcf5442..4a275967 100644 --- a/docs/_build/html/advertools.urlytics.html +++ b/docs/_build/html/advertools.urlytics.html @@ -140,11 +140,13 @@

    The main function here is url_to_df(), which as the name suggests, converts URLs to DataFrames.

    -
    >>> urls = ['https://netloc.com/path_1/path_2?price=10&color=blue#frag_1',
    -...         'https://netloc.com/path_1/path_2?price=15&color=red#frag_2',
    -...         'https://netloc.com/path_1/path_2/path_3?size=sm&color=blue#frag_1',
    -...         'https://netloc.com/path_1?price=10&color=blue']
    ->>> url_to_df(urls)
    +
    import advertools as adv
    +
    +urls = ['https://netloc.com/path_1/path_2?price=10&color=blue#frag_1',
    +        'https://netloc.com/path_1/path_2?price=15&color=red#frag_2',
    +        'https://netloc.com/path_1/path_2/path_3?size=sm&color=blue#frag_1',
    +        'https://netloc.com/path_1?price=10&color=blue']
    +adv.url_to_df(urls)
     
    @@ -244,6 +246,8 @@
    +

    A more elaborate example on how to analyze URLs shows how you +might use this function after obtaining a set of URLs.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.word_frequency.html b/docs/_build/html/advertools.word_frequency.html index b56fc97a..a293c95d 100644 --- a/docs/_build/html/advertools.word_frequency.html +++ b/docs/_build/html/advertools.word_frequency.html @@ -379,7 +379,7 @@

    Absolute vs Weighted Frequency -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.word_tokenize.html b/docs/_build/html/advertools.word_tokenize.html index a5ef3eda..21190c4f 100644 --- a/docs/_build/html/advertools.word_tokenize.html +++ b/docs/_build/html/advertools.word_tokenize.html @@ -208,7 +208,7 @@
    -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/advertools.youtube.html b/docs/_build/html/advertools.youtube.html index adc22139..3046fc5e 100644 --- a/docs/_build/html/advertools.youtube.html +++ b/docs/_build/html/advertools.youtube.html @@ -1324,7 +1324,7 @@
    -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/genindex.html b/docs/_build/html/genindex.html index 5fc8f5e2..a262beca 100644 --- a/docs/_build/html/genindex.html +++ b/docs/_build/html/genindex.html @@ -703,7 +703,7 @@

    Y


    -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/include_changelog.html b/docs/_build/html/include_changelog.html index 5bd4cf50..cfa443a0 100644 --- a/docs/_build/html/include_changelog.html +++ b/docs/_build/html/include_changelog.html @@ -178,6 +178,13 @@

    advertoolsExtract structured entities from text lists
  • 🕷 Python Status Code Checker with Response Headers
  • @@ -987,7 +994,7 @@

    0.1.0 (2018-07-02) -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/index.html b/docs/_build/html/index.html index b72f4ad1..5f97aa8a 100644 --- a/docs/_build/html/index.html +++ b/docs/_build/html/index.html @@ -259,6 +259,13 @@

    Online marketing productivity and analysis toolsExtract Structured Entities from Text
  • Stop Words
  • Built with Sphinx using a diff --git a/docs/_build/html/modules.html b/docs/_build/html/modules.html index 6acda574..1192b3f8 100644 --- a/docs/_build/html/modules.html +++ b/docs/_build/html/modules.html @@ -139,6 +139,13 @@

    advertoolsExtract structured entities from text lists
  • 🕷 Python Status Code Checker with Response Headers
  • @@ -237,7 +244,7 @@

    advertools -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/py-modindex.html b/docs/_build/html/py-modindex.html index f0a80ddc..1711f4aa 100644 --- a/docs/_build/html/py-modindex.html +++ b/docs/_build/html/py-modindex.html @@ -254,7 +254,7 @@

    Python Module Index


    -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/readme.html b/docs/_build/html/readme.html index 0ae48666..593dedf6 100644 --- a/docs/_build/html/readme.html +++ b/docs/_build/html/readme.html @@ -345,7 +345,7 @@

    Conventions -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/search.html b/docs/_build/html/search.html index 56f2cce8..1d9bfcab 100644 --- a/docs/_build/html/search.html +++ b/docs/_build/html/search.html @@ -132,7 +132,7 @@
    -

    © Copyright 2021, Elias Dabbas.

    +

    © Copyright 2022, Elias Dabbas.

    Built with Sphinx using a diff --git a/docs/_build/html/searchindex.js b/docs/_build/html/searchindex.js index 842722f6..ada5b414 100644 --- a/docs/_build/html/searchindex.js +++ b/docs/_build/html/searchindex.js @@ -1 +1 @@ -Search.setIndex({docnames:["advertools","advertools.ad_create","advertools.ad_from_string","advertools.code_recipes","advertools.code_recipes.spider_strategies","advertools.emoji","advertools.extract","advertools.header_spider","advertools.knowledge_graph","advertools.kw_generate","advertools.logs","advertools.regex","advertools.reverse_dns_lookup","advertools.robotstxt","advertools.serp","advertools.sitemaps","advertools.spider","advertools.stopwords","advertools.twitter","advertools.url_builders","advertools.urlytics","advertools.word_frequency","advertools.word_tokenize","advertools.youtube","include_changelog","index","modules","readme"],envversion:{"sphinx.domains.c":2,"sphinx.domains.changeset":1,"sphinx.domains.citation":1,"sphinx.domains.cpp":4,"sphinx.domains.index":1,"sphinx.domains.javascript":2,"sphinx.domains.math":2,"sphinx.domains.python":3,"sphinx.domains.rst":2,"sphinx.domains.std":2,"sphinx.ext.viewcode":1,sphinx:56},filenames:["advertools.rst","advertools.ad_create.rst","advertools.ad_from_string.rst","advertools.code_recipes.rst","advertools.code_recipes.spider_strategies.rst","advertools.emoji.rst","advertools.extract.rst","advertools.header_spider.rst","advertools.knowledge_graph.rst","advertools.kw_generate.rst","advertools.logs.rst","advertools.regex.rst","advertools.reverse_dns_lookup.rst","advertools.robotstxt.rst","advertools.serp.rst","advertools.sitemaps.rst","advertools.spider.rst","advertools.stopwords.rst","advertools.twitter.rst","advertools.url_builders.rst","advertools.urlytics.rst","advertools.word_frequency.rst","advertools.word_tokenize.rst","advertools.youtube.rst","include_changelog.rst","index.rst","modules.rst","readme.rst"],objects:{"":[[0,0,0,"-","advertools"]],"advertools.ad_create":[[1,1,1,"","a
d_create"]],"advertools.ad_from_string":[[2,1,1,"","ad_from_string"]],"advertools.code_recipes":[[4,0,0,"-","spider_strategies"]],"advertools.emoji":[[5,1,1,"","emoji_search"],[5,1,1,"","extract_emoji"]],"advertools.extract":[[6,1,1,"","extract"],[6,1,1,"","extract_currency"],[6,1,1,"","extract_exclamations"],[6,1,1,"","extract_hashtags"],[6,1,1,"","extract_intense_words"],[6,1,1,"","extract_mentions"],[6,1,1,"","extract_numbers"],[6,1,1,"","extract_questions"],[6,1,1,"","extract_urls"],[6,1,1,"","extract_words"]],"advertools.header_spider":[[7,2,1,"","HeadersSpider"],[7,1,1,"","crawl_headers"]],"advertools.header_spider.HeadersSpider":[[7,3,1,"","custom_settings"],[7,4,1,"","errback"],[7,3,1,"","name"],[7,4,1,"","parse"],[7,4,1,"","start_requests"]],"advertools.knowledge_graph":[[8,1,1,"","knowledge_graph"]],"advertools.kw_generate":[[9,1,1,"","kw_broad"],[9,1,1,"","kw_exact"],[9,1,1,"","kw_generate"],[9,1,1,"","kw_modified"],[9,1,1,"","kw_neg_broad"],[9,1,1,"","kw_neg_exact"],[9,1,1,"","kw_neg_phrase"],[9,1,1,"","kw_phrase"]],"advertools.logs":[[10,1,1,"","crawllogs_to_df"],[10,1,1,"","logs_to_df"]],"advertools.reverse_dns_lookup":[[12,1,1,"","reverse_dns_lookup"]],"advertools.robotstxt":[[13,1,1,"","robotstxt_test"],[13,1,1,"","robotstxt_to_df"]],"advertools.serp":[[14,1,1,"","serp_goog"],[14,1,1,"","serp_youtube"],[14,1,1,"","set_logging_level"],[14,1,1,"","youtube_channel_details"],[14,1,1,"","youtube_video_details"]],"advertools.sitemaps":[[15,1,1,"","sitemap_to_df"]],"advertools.spider":[[16,1,1,"","crawl"]],"advertools.twitter":[[18,1,1,"","authenticate"],[18,1,1,"","get_application_rate_limit_status"],[18,1,1,"","get_available_trends"],[18,1,1,"","get_favorites"],[18,1,1,"","get_followers_ids"],[18,1,1,"","get_followers_list"],[18,1,1,"","get_friends_ids"],[18,1,1,"","get_friends_list"],[18,1,1,"","get_home_timeline"],[18,1,1,"","get_list_members"],[18,1,1,"","get_list_memberships"],[18,1,1,"","get_list_statuses"],[18,1,1,"","get_list_subscribers"],[18,1,1,
"","get_list_subscriptions"],[18,1,1,"","get_mentions_timeline"],[18,1,1,"","get_place_trends"],[18,1,1,"","get_retweeters_ids"],[18,1,1,"","get_retweets"],[18,1,1,"","get_supported_languages"],[18,1,1,"","get_user_timeline"],[18,1,1,"","lookup_status"],[18,1,1,"","lookup_user"],[18,1,1,"","make_dataframe"],[18,1,1,"","retweeted_of_me"],[18,1,1,"","search"],[18,1,1,"","search_users"],[18,1,1,"","set_auth_params"],[18,1,1,"","show_lists"],[18,1,1,"","show_owned_lists"]],"advertools.url_builders":[[19,1,1,"","url_utm_ga"]],"advertools.urlytics":[[20,1,1,"","url_to_df"]],"advertools.word_frequency":[[21,1,1,"","word_frequency"]],"advertools.word_tokenize":[[22,1,1,"","word_tokenize"]],"advertools.youtube":[[23,1,1,"","activities_list"],[23,1,1,"","captions_list"],[23,1,1,"","channel_sections_list"],[23,1,1,"","channels_list"],[23,1,1,"","comment_threads_list"],[23,1,1,"","comments_list"],[23,1,1,"","guide_categories_list"],[23,1,1,"","i18n_languages_list"],[23,1,1,"","i18n_regions_list"],[23,1,1,"","playlist_items_list"],[23,1,1,"","playlists_list"],[23,1,1,"","search"],[23,1,1,"","subscriptions_list"],[23,1,1,"","video_categories_list"],[23,1,1,"","videos_list"]],advertools:[[1,0,0,"-","ad_create"],[2,0,0,"-","ad_from_string"],[3,0,0,"-","code_recipes"],[5,0,0,"-","emoji"],[6,0,0,"-","extract"],[7,0,0,"-","header_spider"],[8,0,0,"-","knowledge_graph"],[9,0,0,"-","kw_generate"],[10,0,0,"-","logs"],[11,0,0,"-","regex"],[12,0,0,"-","reverse_dns_lookup"],[13,0,0,"-","robotstxt"],[14,0,0,"-","serp"],[15,0,0,"-","sitemaps"],[16,0,0,"-","spider"],[17,0,0,"-","stopwords"],[18,0,0,"-","twitter"],[19,0,0,"-","url_builders"],[20,0,0,"-","urlytics"],[21,0,0,"-","word_frequency"],[22,0,0,"-","word_tokenize"],[23,0,0,"-","youtube"]]},objnames:{"0":["py","module","Python module"],"1":["py","function","Python function"],"2":["py","class","Python class"],"3":["py","attribute","Python attribute"],"4":["py","method","Python 
method"]},objtypes:{"0":"py:module","1":"py:function","2":"py:class","3":"py:attribute","4":"py:method"},terms:{"0":[4,5,6,7,8,9,10,11,12,13,14,15,16,20,21,23,25],"00":[10,13,14,15,23],"000":[14,18,22],"0000":10,"000000":21,"000b":16,"0039":16,"0043":16,"004a":16,"006f":16,"00954418":10,"00987329":10,"00a1":16,"00bf":16,"00c2":16,"00ce":16,"00e6":16,"00z":[14,15,23],"01":[13,14,15,23,25],"0126707":10,"0129998":10,"0133289":10,"0185947":10,"018jz":23,"018w8":23,"019582":10,"019_rr":23,"01a2":16,"01cgz":23,"01h6rj":23,"01h7lh":23,"01k8wb":23,"01lyv":23,"01sjng":23,"01t00":[14,23],"02":[7,13,15,25],"0213921":10,"021bp2":23,"022dc6":23,"024":[15,24],"024x1":24,"0253415":10,"025zzc":23,"0270483":7,"0271282":7,"027x7n":23,"0281389":10,"028sqc":23,"029949":10,"02d86a3cea00007e9edb0cf2000000":16,"02d86a3e0e00007e9edb0d72000000":16,"02d86a3e1300007ec2a808a2000000":16,"02d86a3e140000d437b81532000000":16,"02d86a3e150000d423322742000000":16,"02d86a494f0000d437b828b2000000":16,"02d86a4a7f00007e9edb13a2000000":16,"02d86a4a7f00007ec2a811f2000000":16,"02d86a4a7f0000d423209db2000000":16,"02d86a4a7f0000d423323b42000000":16,"02hygl":23,"02jjt":23,"02lkt":23,"02mscn":23,"02ntfj":23,"02vx4":23,"02vxn":23,"02wbm":23,"03":[13,15,25],"0315945":10,"032tl":23,"037hz":23,"03_d0":23,"03c3":16,"03glg":23,"03hf_rm":23,"03t17":15,"03tmr":23,"04":[7,15,25],"0403l3g":23,"0410tth":23,"041xxh":23,"0477209":10,"04q1x3q":23,"04rlf":23,"05":[15,16,25],"05qjc":23,"05qt0":23,"05rwpb":23,"06":[15,25],"06442":7,"064t9":23,"066667":21,"066wd":23,"068hy":23,"06bvp":23,"06by7":23,"06cqb":23,"06j6l":23,"06ntj":23,"07":[13,15,25],"0701004":10,"0710e93d610dd8c3":7,"0774069":15,"07_53":23,"07bs0":23,"07bxq":23,"07c1v":23,"07yv9":23,"08":[13,15,25],"08427":[14,23],"087985":13,"08t17":15,"09":[13,15,16,25],"090302_gazaconferenciaml":15,"090409_machienhuu_revisit":15,"090421_mqm_speaks_rza":15,"090524_paquistaoupdateg":15,"090618_tomtest":15,"090620_as_iraq_explosion_tc2":15,"090620_iraq_blast_tc2":15,"090622_me_egyp
t_us_tc2":15,"090622_me_worldbank_tc2":15,"090623_egitomilitaresfn":15,"090623_iz_cairo_russia_tc2":15,"090623_mz_leaders_lifespan_tc2":15,"090624_me_inpictures_brazil_tc2":15,"090624_mz_wimbledon_tc2":15,"090625_sf_tamim_verdict_tc2":15,"090628_rn_pakistani_soldiries_ambush":15,"090629_om_pakistan_report_tc2":15,"090715_hillary_iran_cq":15,"090723_ae_silwan_tc2":15,"090729_iraquerefenbritsfn":15,"090830_ugc_ddh_sand":15,"090831_dalailamataiwan":15,"090901_japecontask":15,"090901_putin_regret_pact":15,"090901_tiananmen_movi":15,"098wr":23,"09kqc":23,"09s1f":23,"09t13":15,"09t15":15,"09xp_":23,"0b1vjn":23,"0bzvm2":23,"0c79465a9793low":15,"0cff645fbb74c21791568b78a888967d":15,"0d790f23c36dlow":15,"0f2f9":23,"0g293":23,"0ggq0m":23,"0glt670":23,"0gywn":23,"0jm_":23,"0kt51":23,"1":[1,4,5,6,7,8,9,10,12,13,14,15,16,17,18,20,21,22,23,25],"10":[2,5,7,10,13,14,15,16,18,20,21,25],"100":[4,10,14,16,18,21],"1000":[14,23],"10000ft":[14,23],"101":10,"101e":16,"103":10,"104":16,"105":10,"108":13,"1080p":[14,23],"1083":7,"109":10,"1090":10,"1095":10,"10968":15,"10t17":15,"11":[5,7,10,13,14,15,16,25],"110":10,"111111":21,"113":10,"117821":10,"118":10,"118614":7,"119":10,"11e1":15,"11t17":15,"12":[10,13,15,16,18,25],"1204":15,"1210":10,"122":[14,23],"123":6,"124":27,"125":[2,12],"1261":10,"1274":15,"1285":15,"129":10,"1293":15,"13":[2,5,7,8,10,13,15,25],"130":[2,10,12,15],"1306":8,"131k":27,"132":10,"13251":8,"13270":7,"133333":21,"135":10,"1350":15,"137":10,"13c3":16,"14":[8,10,13,15,25],"140":18,"14022":15,"1415":10,"143":10,"1435":8,"146":[10,13],"147":13,"148":13,"149":13,"149416":10,"14c904a172315a4922f4d28948b916c2":7,"15":[2,8,10,15,20,23],"150":13,"1500m":[14,23],"1506":15,"1509":8,"152":10,"1534":15,"154":10,"154258":10,"1545":10,"1555":15,"1585538956622":15,"1585539039190":15,"1585539054298":15,"1585539172701":15,"1585539206866":15,"1585539237156":15,"1585539358901":15,"1585539536519":15,"16":[4,10,13,15],"163":10,"164":10,"1647":16,"1657":15,"1664":10,"1677":15,"17":[7,10,1
3,15,16,25],"170":[7,16],"171":10,"173":10,"174":10,"176":10,"177":10,"1777":10,"179":10,"179365":10,"18":[7,10,15,25],"180":[7,16],"182":10,"184":15,"185":[10,12],"1858":10,"18c3":16,"19":[7,13,16,25],"191":8,"19142":8,"192":10,"1937":10,"194":[10,12],"1959":15,"196":10,"1970":[14,23],"1d9b91664204low":15,"1f1ee":5,"1f1f8":5,"1f32d":5,"1f33d":5,"1f340":5,"1f346":5,"1f3e9":5,"1f3fb":5,"1f3fc":5,"1f3fd":5,"1f3fe":5,"1f3ff":5,"1f415":5,"1f436":5,"1f48c":5,"1f499":5,"1f4d8":5,"1f535":5,"1f537":5,"1f539":5,"1f7e6":5,"1f91f":5,"1f94a":5,"1f951":5,"1f954":5,"1f955":5,"1f9ae":5,"1f9ba":5,"1f9e4":5,"1fad0":5,"1mb":15,"1winner":15,"2":[4,5,6,7,8,9,10,12,13,14,15,16,18,20,21,22,23,25],"20":[1,6,8,10,13,14,15,16,18,21,23,24],"200":[7,10,16,18,21],"200000":21,"200689":13,"2008":15,"2009":[15,16],"200d":5,"2010":15,"2011":15,"2012":15,"2013":15,"2014":[10,15],"2015":[15,17,18],"2016":[15,17],"2017":[15,23],"2018":[15,25],"2019":[15,25],"201e":16,"202":16,"2020":[13,15,16,25],"2021":[13,15,25],"2022":[7,10,13,15,25],"203":[8,10],"203191":8,"2074":10,"207504":10,"209":10,"20pct_off":19,"21":[10,13,14,15,16,18,19,25],"2103":15,"211":[10,12],"2132":10,"214":10,"217":10,"2190":10,"22":[10,13,15],"222222":21,"223":10,"2240":10,"225":10,"226":10,"2287":15,"23":[10,13,15,16,25],"232845":10,"234":10,"237":10,"24":[13,15],"241":10,"243":[10,12],"244":10,"249":[10,12],"24c3":16,"25":[2,6,12,15,16,19,25],"250":21,"252":8,"254237":10,"2547":10,"26":[1,7,10,16,19,25],"266667":21,"26837":7,"27":[7,13,15,23,25],"270":2,"273819":10,"2769":15,"27t17":15,"28":[1,13],"283":13,"284":13,"285":13,"286":13,"287":13,"289":13,"29":[7,10,15,25],"290":[10,13],"291":13,"2910":15,"292":[13,15],"292414":10,"293":13,"2950":15,"2951":15,"2952":15,"2953":15,"2954":15,"2955":15,"2984":15,"2ad504a1":16,"2anam":19,"2d":[14,23],"2e3b74":16,"2e454f":16,"2e494d":16,"2e4ccb":16,"2e77d2":16,"2e93a0":16,"2ed585":16,"2ef5ef":16,"2f1d9f":16,"2f6d5c":16,"2nd":11,"3":[4,5,6,7,8,9,10,12,13,14,15,16,18,20,21,22,25],"30":[1,2,1
0,13,14,15,25],"300":21,"301":16,"302":[7,16],"3021":15,"305743":10,"31":[10,12,15,25],"3153":15,"31536000":[7,16],"316":8,"3166":[14,23],"318743":10,"32":[7,10,13,15,16],"321":8,"3250":15,"33":[8,13],"3313":8,"331414":10,"333":6,"333333":21,"3339":[14,23],"3395":8,"34":8,"341287":10,"34be9bf74f00low":15,"34c3":16,"35":[8,10,16],"350831":10,"3561":15,"3587":8,"36":[10,13,16],"3600":16,"360375":10,"3682":15,"37":[14,15,23],"373":15,"375":12,"375724":13,"38":[10,16],"39":[10,12,13,15,16],"39687acb":15,"397":13,"398":13,"399":13,"3d":[14,23],"3f44":16,"3k":27,"4":[5,6,8,9,10,12,13,15,16,18,20,21,23,25],"40":[13,14,16],"400":[4,13,21],"401":13,"404":[10,16],"4044":10,"41":15,"41b0":15,"42":10,"4224":15,"42307":[14,23],"426":10,"4281":15,"43":15,"4312":8,"44":[10,13],"443":7,"4430":10,"444":6,"45":[10,14],"450":14,"456":6,"46":[10,15],"461037":15,"461815":13,"462":8,"466e":15,"468588":13,"47":10,"474456":13,"4758":10,"47603":15,"48":[10,13,15],"4883":15,"488ed635":15,"49":[8,10],"491":15,"49462":8,"499":10,"49994":15,"49995":15,"49996":15,"49997":15,"49998":15,"49999":15,"4c69":15,"4f34":15,"4f7bea3b":16,"4k":6,"5":[1,5,6,8,9,10,12,13,14,15,16,17,21,25],"50":[1,13,14,21,24],"500":[4,8,13,14,18,21,23],"5000":18,"501e":16,"5050":15,"5056":8,"505b":15,"5065":15,"5068":15,"5080":15,"5081":15,"5082":15,"5083":15,"5084":15,"5085":15,"51":[10,12,13],"510":15,"52":[13,15],"520":[10,15],"53":[8,10],"533":15,"536":13,"537":[10,13],"538":[13,27],"539":13,"54":[8,15],"540":13,"5403":15,"541":13,"545":15,"547":15,"55":[8,9,15],"554":15,"555":6,"556":15,"56":[9,10,12,13,15],"565":15,"57":[9,13,15],"576":8,"58":[9,10,13],"584":8,"59":9,"596daca7dbaa7e9":16,"596daca9b91fd437":16,"596daca9bcab7e9":16,"596daca9bddb7ec2":16,"596daca9bf26d423":16,"596dacbbb8afd437":16,"596dacbd980bd423":16,"596dacbd980cd423":16,"596dacbd99847ec2":16,"596dacbd9fb97e9":16,"5e":19,"5km":[14,23],"5x":10,"6":[5,6,8,10,12,13,15,21,25],"60":[10,12,13],"600000":21,"604800":[7,16],"619bd9be1d75db41adee6b58":15,"6201
430a1d75db06ae1f62e8":15,"620345a15577c23d46622256":15,"6203cd7b5577c23d19622259":15,"62067f085577c277dd9acf42":15,"625":[9,12],"626":9,"627":9,"628":9,"629":9,"630":9,"63124":15,"632":15,"635":15,"638":15,"639":[8,14,18,23],"64":13,"640":15,"645":15,"6543":8,"66":[10,12,16],"6666666666666666":6,"6666666666666667":6,"666667":21,"67":16,"674":15,"68":[10,13,16],"683":15,"6853":8,"69":[10,16],"6dba2aae6b424107":7,"7":[5,8,10,12,13,15,18,21,25],"70":[10,16],"701e":16,"702814":13,"706":15,"716":10,"71756":8,"72":[10,13,23],"7200":7,"720a8581":16,"720p":[14,23],"727":15,"728x90":19,"729":10,"73":10,"74":12,"744247":15,"745":10,"75":[4,5,10,12,13,16],"7549":8,"755":15,"75911c9e":16,"75mi":[14,23],"76":13,"769":15,"77":[10,13],"78":13,"789":6,"79":[10,13],"7a28ef3b":16,"7c":[14,23],"7ec3":16,"8":[4,5,7,8,10,12,13,15,16,18,21,25],"80":[10,12,21],"800000":21,"801e":16,"81":10,"815":15,"8192":23,"82":16,"83":10,"841":15,"841851":15,"85855c48":16,"8601":23,"86199":15,"862":15,"86400":7,"872":15,"874":15,"875":12,"8760":8,"8808":15,"882":15,"888889":21,"89":10,"9":[5,7,8,10,13,15,16,21,25],"90":[2,10],"9044":15,"908":10,"90b11f47f8b2ab57cb180cbd3c6f06f9":15,"91":12,"913":15,"914107":15,"91d0":15,"92":10,"933333":21,"94":10,"94f1":15,"951053":13,"96":12,"97":12,"973":15,"98":10,"98b729fa":16,"99":15,"995323":15,"9cbd":15,"9dfdd38a":16,"9e64":15,"\u00e0":1,"\u03b5\u03af\u03c3\u03b1\u03b9":6,"\u03c0\u03ce\u03c2":6,"\u062a\u0630\u0647\u0628":6,"\u062d\u0627\u0644\u0643":6,"\u0643\u064a\u0641":6,"\u0644\u0627":6,"\u0645\u0631\u062d\u0628\u0627":6,"boolean":[8,14,16,23],"break":[15,18,24,27],"byte":[7,15,16,24],"c\u00f3mo":6,"case":[1,2,4,5,6,7,9,10,12,13,14,15,16,18,20,21,24,27],"char":1,"class":[7,16],"default":[2,4,6,8,9,10,14,15,16,18,21,22,23,24,27],"do":[0,2,3,7,9,10,12,13,14,15,16,18,20,21,23,25,27],"est\u00e1":6,"export":16,"final":[9,15,20,23,24],"float":[14,23],"function":[0,2,4,5,7,8,9,12,13,14,15,20,21,22,24,25,26,27],"haftungsbeschr\u00e4nkt":17,"import":[0,1,2,4,5,6,7,9
,10,12,13,15,16,17,18,20,22,23,24,25,26,27],"int":[1,6,9,12,15,18,21],"long":[0,1,6,10,12,13,14,18,23,24,25,26,27],"new":[0,4,6,10,14,24,25,26,27],"null":18,"public":[5,7,16,18],"return":[1,2,5,6,7,8,9,10,12,13,14,15,18,19,20,21,22,23,24,27],"s\u00fcdkorea":8,"short":[2,14,21,23],"static":[10,13],"super":[7,10],"true":[1,2,4,6,7,9,10,13,14,15,16,18,20,21,23,24],"try":[10,13,14,16,21,23,27],"while":[0,3,10,14,18,20,21,23,24,25,26],A:[4,5,6,7,8,9,10,11,13,14,15,16,18,20,21,22,23,24,27],AND:14,And:[8,10],As:[1,4,12,13,15,20,21,22,23,27],At:[14,23],Being:7,But:[4,16,21],By:[10,14,16,21,23],For:[1,4,7,8,10,13,14,15,16,18,21,23],IS:[1,2],If:[2,4,6,7,8,10,14,15,16,18,20,21,23,24,25],In:[1,2,6,8,10,12,13,14,15,16,18,20,21,23,24,27],Is:[1,8,15],It:[4,6,7,8,9,10,12,14,15,16,18,20,21,23],NOT:[6,14,23],No:[6,14],Not:[5,18],ON:18,OR:[14,18,23,25,27],On:[0,2,18,24,25,26],One:[1,7,13,15,16,21],Or:[9,16,20],THE:19,That:[2,4,16,23],The:[0,2,4,5,6,7,8,9,10,12,13,14,15,16,18,21,22,23,24,25,26,27],Then:[16,18],There:[4,6,7,10,14,15,16,18,20,24,27],These:[4,10,16,21],To:[2,9,13,16,21,23,25],With:[7,15,18,21],_:15,__cfduid:16,__init__:24,_dash:10,_dict_product:24,_escaped_fragment_:13,_static:16,_to_df:27,a320:15,a850165d925db701988daf7ead7492d3:13,abbrevi:6,abil:[16,23,24],abl:[7,8,13,14],about:[2,4,5,6,7,10,12,13,14,15,16,18,20,21,23,24,25,27],abov:[4,8,16,18,20,21,24],abs_freq:[21,24],abs_perc:21,abs_perc_cum:21,abs_wtd_df:21,absolut:[0,12,13,20,24,25,26,27],accept:[7,14,16,23,24],access:[10,13,14,17,18,23,27],access_log:10,access_token:18,accid:4,accomplish:[21,27],accord:[13,22],account:[0,9,13,14,18,21,23,24,25,26],achiev:[4,22,27],across:[4,5,8,14,15,20,21,27],act:[14,23],action:[23,24],activ:[5,8,14,15,23],activities_list:23,actress:8,actriz:8,actual:[8,12,15,16,20,21,23],ad:[0,9,16,18,19,23,24,25,26,27],ad_:[16,27],ad_creat:[1,9,16,24,27],ad_from_str:[2,9,16,24,27],add:[4,7,10,16,21],add_prefix:10,addit:[0,2,6,10,12,14,18,21,23,24,25,26,27],addition:[16,18],addr:[10,12],address:
[10,12,16,24,27],addressse:14,adgroup:9,administrativearea:8,adress:[10,12],adv:[1,2,4,5,6,7,9,10,12,13,15,16,17,18,21],adv_error:10,adv_log:10,adv_logs_fin:10,advantag:10,adventur:23,adver:[7,10,16],advertoo:16,advertool:[1,2,4,5,6,7,9,10,12,13,15,16,17,18],afaa7cb5e636low:15,affect:16,afghan:15,afghanistan:15,after:[2,4,6,14,15,16,18,20,21,22,23,27],afterward:21,ag:[7,16],again:[4,10,15,16,21],against:[8,18,21],agent:[0,3,7,10,12,16,24,25,26,27],aggreg:8,ahrefsbot:10,ai:15,aid:5,ajax:13,alert:7,algarv:1,algorithm:27,alias:8,aliaslist:[10,12],align:20,all:[2,4,5,6,7,8,9,10,13,14,15,16,18,20,21,23,24,27],allow:[1,2,7,10,13,14,16,18,23,24,27],allowed_domain:[4,16],allthreadsrelatedtochannelid:23,almost:[10,21],alon:21,along:[6,18,21],alpha:[14,23],alphabet:[8,14,23],alreadi:[4,21],also:[1,2,4,6,7,8,9,10,12,13,14,15,16,17,18,20,21,22,23,24,27],alt:[16,18,24],alt_href:[4,16],alt_hreflang:[4,16],altern:[4,13,16,24],although:[2,16,21],altogeth:10,alwai:[2,18,21],am:[5,21],amazon:[13,15,18],america:23,america_latina:15,american:23,among:21,amongst:21,amount:[16,21],amp:15,amplifi:18,amz:7,an:[1,2,4,5,6,7,8,9,10,12,13,14,15,16,18,21,22,23,24,25,27],analysi:[0,6,7,12,15,16,18,24,26],analyt:[0,20,21,24,25],analyz:[0,7,14,16,17,18,21,24,25,26,27],anchor:[4,16],anderson:15,android:[10,15],ani:[2,4,5,6,8,9,10,13,14,15,16,18,20,21,22,23,24,27],anim:5,annot:11,anonym:10,anoth:[2,7,9,10,15,20,21,22],anotherexampl:16,anotherexmapl:16,answer:15,anyhow:21,anymor:24,anyon:21,anyth:[4,18,21,24],anywai:[9,21],anywher:[18,21],apache_error:10,api:[0,14,24,25,26,27],api_vers:18,app:[13,14,18,23],app_kei:18,app_secret:18,appear:[14,15,16,18,21,24],append:[2,13,14,16],appl:[13,21],applebot:13,applewebkit:10,appli:[13,14,15,16],applic:[7,8,10,14,16,18,23],appliedprivaci:10,approach:[0,9,20,21,24,25,26,27],appropri:23,ar:[2,4,6,7,8,9,10,13,14,15,16,18,20,21,22,23,24,25,27],arab:[6,14,15,17,24],arbitrari:[6,18,24],archiv:15,area:[14,23,27],aren:9,arg:7,argument:[4,8,14,16,24],armenian:6,around:
[5,6,21],arpa:[10,12],art:23,articl:[0,15,20,24,25,26,27],articlebodi:8,articlelarg:15,artilc:20,asia:23,ask:[6,14,18,24],associ:[14,21,23],assum:[14,16,18,24],assur:7,astronaut:18,attach:[14,18,23],attack:15,attempt:16,attent:12,attitud:18,attr:16,attract:23,attribut:[4,14,16,18,21,24],au:14,audit:[0,3,13,15,16,25],auditdetail:23,australia:14,auth_endpoint:18,auth_param:18,authent:[0,12,14,23,24,25,26],author:[14,16,18,20,23],author_url:16,autocomplet:[15,27],autom:[4,7,13,27],automat:[0,3,14,23,25,27],avail:[2,4,7,8,10,11,14,15,16,17,18,20,21,23,24,27],avocado:5,avoid:20,aw:15,await:23,axi:10,azerbaijani:[17,24],b023:15,b0aef497:16,b935:15,b:[6,7,10],bY:2,back:[10,18,21,27],backend:[7,16],bad:24,bag:21,baiduspid:[10,13],ban:4,banana:21,bandwidth:7,banner:19,barcelona:9,base:[0,2,3,5,7,11,14,16,18,21,23,24,25,27],basebal:23,basi:7,basic:[4,7,9,12,15,20,27],basketbal:[5,23],batteri:4,bbc:[13,15],bbc_sitemap:15,beacon:7,bearer:18,beat:21,beauti:23,becam:21,becaus:[8,10,12,13,16,18,20,21],becom:[2,10,16,20,21],been:[4,15,18,21,23],beer:18,befor:[4,6,14,16,18,21,23],beforehand:21,begin:[18,22,24],behalf:[14,23],behavior:[0,7,15,23,24,25,26,27],behaviour:16,behind:21,being:[14,15,16,18,20,21,23,24,27],belong:[8,12,15,18],below:[8,14,16,21,22,23],ben:15,benefit:[2,20,27],bengali:[17,24],benton:15,besid:21,best:[14,18,21],better:[4,15,16,18,20,24,27],between:[4,9,10,14,15,16,21,22,23,27],beyond:21,bid:19,big:[4,9,10],bill:[8,14],bing:8,bingbot:[10,13],bitcoin:6,black:[14,16,21],blob:16,block:[4,10,13,15,16],blockblob:16,blocked_url:10,blog:20,bloomberg:27,blown:21,blue:[5,6,14,20,21,23],blueberri:5,bmw:[1,9],boat:[14,23],bodi:[5,7,16,18,27],body_text:[16,24],book:[5,21],bool:[1,2,6,9,15,16,18,20,21],boost:14,bot:[10,12],both:[6,9,14,16,18,21,22,23,27],bottom:[9,21,27],bounc:[16,21],box:[5,13,15,23],brace:1,brand:[6,8,10,15],brandingset:23,broad:9,broadcast:[14,23],broken:18,brown:14,browser:8,bud:16,bug:[15,24],bui:[9,13],build:[5,7,10,27],builder:[0,24,25,26],built:27,bu
lgarian:14,bulk:[0,24,25,26],bunch:16,buscador:8,busi:[15,23],butt:15,c01e:16,c2coff:14,c:[4,7,17],c_fill:15,ca:[14,21],cach:[7,16],call:[1,14,15,16,18,20,21,24,27],camp:16,campaign:[0,1,19,24,25,26],campaign_nam:9,can:[0,2,3,5,6,7,8,9,10,12,13,14,15,16,17,18,20,21,22,23,24,25,27],can_fetch:13,cannot:[18,21],canon:[4,7,16,24],canonical_par:4,cantant:8,capit:[1,2,8,9],capitalize_adgroup:[9,24],captial:2,caption:[14,23,24],captions_list:23,captur:[15,27],car:1,card:[16,18,24],card_uri:18,care:13,career:[9,13],carrot:5,casual:23,cat:5,catalan:[14,17,24],categor:[10,20],categori:[1,14,15,20,23],categoryid:23,cater:10,caus:[18,24],cc_attribut:14,cc_noncommerci:14,cc_nonderiv:14,cc_publicdomain:14,cc_sharealik:14,cdn:7,celebr:15,center:[14,23],certain:[0,3,6,7,8,10,12,13,15,16,17,20,21,24,25],certainli:10,certif:9,cgi:7,chain:16,chanc:8,chang:[2,4,10,13,14,16,21,27],changefreq:15,channel:[14,23,24,27],channel_id:14,channel_sections_list:23,channelid:[14,23],channelplaylistvideo:23,channels_list:23,channelsect:23,channeltyp:[14,23],charact:[2,6,14,18,21,22,23,24],characterisit:10,charset:[4,7,16,24],chart:23,cheap:9,cheat:24,check:[4,6,7,8,9,10,12,13,14,15,16,21,27],checker:[0,24,25,26],child:23,china:15,chines:[14,17,23,24],choic:5,chokkattu:15,choos:[14,16,23],chose:10,chosen:10,christian:23,christma:15,chrome:[8,10],chronolog:[14,23],cinta:1,circl:5,circular:[14,23],citi:[1,8],claim:12,clarif:24,classic:23,classifi:23,clean:27,clear:[8,9,18],clearli:[9,20],click:27,client:10,client_arg:18,cline:15,clipart:14,close:4,closedcapt:[14,23],closespider_errorcount:[4,16],closespider_itemcount:[4,16],closespider_pagecount:[4,16],closespider_timeout:[4,16],cloth:5,cloudflar:[7,16],cloudfront:15,clover:5,club:[9,27],clue:13,cm:[14,23],cn:14,code:[0,4,5,6,8,10,14,15,16,18,19,23,24,25,26,27],code_recip:[0,24,25,26],codepoint:5,cohort:7,collect:[11,13,14,18,23,24],collin:15,collinss:15,colliss:20,color:[14,16,20,21],column:[4,7,8,9,10,13,14,15,16,18,20,21,24],com:[4,5,6,7,8,10,12,13
,14,15,16,18,19,20,23],comand:12,combin:[8,9,10,11,13,14,16],come:[2,9,10,21],comma:[14,18,21,22,23],command:[4,10,12,13,25],comment:[13,16,23,24,27],comment_threads_list:23,comments_list:23,commentthread:23,commerc:[9,21],common:[7,10,14,23],common_with_vhost:10,commun:[4,20,27],compani:[6,8,13],compar:[15,20],comparison:[8,12],compat:[10,18],compil:11,complet:[6,9,14,18,20,21,23],complex:[10,18],complic:18,compon:[7,10,18,20,24],comprehens:27,compress:[10,24],comput:[4,10,16],concat:[10,16],concaten:15,concurr:[0,3,14,23,24,25],concurrent_item:4,concurrent_request:4,concurrent_requests_per_domain:[4,16],concurrent_requests_per_ip:4,condit:[0,3,10,16,25],conduct:13,confid:16,configur:[16,23],conform:10,conformig:10,conglomer:8,congression:15,conjunct:[14,18,23],connect:[4,13,18,24,27],consecut:[4,16],consid:[6,18,23],consider:[2,21,27],consist:[2,4,9,10,18,20,21,24],consol:[0,14,20,23,25],constrain:[14,23],consum:[7,18],consumed_onli:18,contaboserv:10,contain:[4,5,6,7,8,9,10,13,14,15,16,18,20,21,22,23,24,27],content:[4,7,8,13,14,15,16,17,20,21,23,24,26],contentdetail:23,contentownerdetail:23,contenturl:8,context:[6,8,11],continu:[7,27],contrast:6,contributornameid:16,control:[0,3,7,14,16,24,25,27],conveni:27,convert:[2,10,16,20,24,27],cookbook:11,cool:27,coordin:[14,23],copi:[0,3,25,27],copyright:[16,17],core:10,corn:5,coronaviru:15,corpor:8,corpu:21,correct:[6,8,24],correctli:2,correspond:15,cost:23,could:[7,14,21,23,24],count:[0,1,5,6,10,12,13,15,18,22,24,25,26,27],counti:15,countri:[5,14,16,20,23,24,27],countryau:14,countryuk:14,cours:[7,9,21],coverag:24,covid:15,cpu:10,cq:15,cr:14,crash:16,crawl:[0,3,7,12,13,20,24,25,26,27],crawl_df:[7,16],crawl_head:[7,24,27],crawl_logs_df:10,crawl_logs_to_df:10,crawl_tim:[7,16],crawler:[0,4,7,10,24,25,26,27],crawllogs_to_df:[10,24],creat:[0,4,5,7,8,9,14,18,20,23,24,25,26,27],creation:27,creativ:[14,23],creativecommon:[14,23],credenti:[8,14,18,23],credibl:18,cricket:23,criteria:23,criterion:9,critic:[8,14],croatian:[14,17,24],
crossorigin:[16,24],crowd:14,cse:24,css:[0,4,24,25,26,27],css_link:4,css_selector:[16,24],csv:10,ct:[7,16],ctrl:4,cultur:15,cultura_sociedad:15,cum_count:[10,12],cum_perc:[10,12],cumul:[12,21],curat:23,currenc:[6,21,24,27],currency_summari:6,currency_symbol:6,currency_symbol_count:6,currency_symbol_freq:6,currency_symbol_nam:6,currency_symbols_flat:6,currency_symbols_per_post:6,current:[4,10,15,16,18,23,24,27],cursor:18,custom:[0,3,7,10,14,24,25,26,27],custom_set:[4,7,10,16,24],customiz:16,cutom_set:4,cx:14,czech:14,d4889b15:15,d74930cf:15,d76b68d148ddec1efd004:16,d9646265:10,d99f2368:16,d:[7,10,14],d_placeholder_thescen:15,dai:[4,14,18,23],danish:[14,17,24],dark:5,dash:[10,24],dash_html_compon:10,dashboard:[18,27],dashboardom:7,data:[0,6,7,9,13,14,15,20,24,25,26,27],databas:[5,6,10,11,24,27],datacamp:27,datafram:[0,5,9,13,14,15,16,18,20,21,24,25,26,27],dataset:[16,20,21,27],date:[10,13,14,15,16,18,23,24,27],daterestrict:14,datetim:[10,14,15,23,24],datetime64:15,david:15,db:24,dd:18,ddthh:23,de:[1,4,8,9,16],deal:27,death:15,debug:[10,14],debut:15,dec:15,decid:[15,16,18],decis:[7,15,27],decod:20,decrib:16,deep:16,default_request_head:16,defeat:15,defin:[8,10,14,21,23,24],definit:[14,23],deflat:[7,16],delai:13,delimit:[20,22],deliveri:27,demot:[14,23],denot:13,depend:[6,7,8,9,15],deprec:[23,24],depth:[0,3,7,16,25],depth_limit:[4,16],desc_text:2,descend:[14,23],describ:[9,21],descript:[0,4,6,8,9,16,18,20,21,23,24,25,26,27],design:[9,13],desir:[10,18],desktop:10,destin:[10,20],detail:[2,7,9,10,13,14,16,18,23,27],detaileddescript:8,detect:18,determin:[0,9,14,21,24,25,26],develop:[5,8,13,14,18,23],df:24,di:[0,3,25],diamond:5,dict:[7,10,16],dict_kei:[5,6,17],dictionari:[4,5,6,7,16,17,24],did:[6,15,21],didn:27,differ:[2,4,5,6,8,9,10,11,13,14,15,16,18,20,21,23,27],differenti:19,difficult:9,digit:[0,27],dimens:[14,23],dir_1:[15,20],dir_2:[15,20],dir_3:[15,20],dir_4:15,dir_5:15,dir_6:15,dir_7:15,direct:[7,13],directli:18,directori:[0,24,25,26],disabl:14,disabled0:14,disallow:[
13,16],disambigu:18,discordbot:13,discount:9,discov:[4,10,16,20,27],discoveri:[0,24,25,26],discreet:18,diseas:15,disk:10,dislik:23,displai:[6,10,13,14,23],dist:18,distanc:[14,23],distinct:18,distinguish:[10,16],distort:20,district:15,divers:27,divid:[2,21],dn:[0,10,24,25,26],doc:[8,18],document:[7,8,14,16,18,21,24],documentaion:16,doe:[2,4,5,6,12,13,14,15,16,21,22,23,27],doen:10,doesn:[4,9,10,16,21],dog:5,dollar:[6,22],domain:[0,3,7,10,12,13,14,16,20,24,25],domin:14,don:[0,1,3,6,7,10,14,16,20,21,24,25,27],done:[4,7,9,10,14,15,20,21,27],dot:[21,22],dotbot:10,down:[0,3,9,10,21,24,25,26,27],downgrad:7,download:[0,4,7,13,16,20,23,24,25,26,27],download_d:[13,15,24],download_delai:[4,16],download_lat:[7,16],download_slot:[7,16],download_timeout:[7,16],download_timout:16,dp8hsntg6do36:15,dr:10,draggabl:[16,24],drink:5,drive:8,drop:24,drop_dupl:13,dtype:[8,10,13,15],dubai:1,due:[6,10,18,21,23],duplic:[4,12,14,16,18],durat:[14,23],dure:[14,21],dutch:[14,17,24],duti:15,dwgyu36up6iuz:15,dynam:[7,16],e01:16,e7e15811c65f406f89f89fe10aef29f5:15,e:[1,7,9,14,16,19,21,23,24],each:[1,2,5,6,8,9,10,11,12,13,14,15,16,17,18,20,21,22,23,24],ear:5,earliest:23,earth:18,easi:[7,9,15,20,24,27],easier:[4,6,9,16,18,20,24,25,27],easiest:15,easili:[2,7,10,13,15,17,18,20,27],ed:11,editor:15,educ:9,ee0djx6z511tgx88:7,effect:[10,18,20],effici:[7,10,12,16],effort:18,eggplant:5,eight:21,eighti:13,either:[6,9,10,14,15,18,21,23,24],elect:15,electron:23,element:[0,2,4,6,7,8,24,25,26,27],element_1:24,element_2:24,eleven:21,eli:16,eliasdabba:5,elig:8,eln:15,els:[2,8,18,21],elsewher:21,email:[8,19],emb:23,embed:[14,18,23],embedd:[14,23],embedhtml:23,emerg:4,emo:16,emoji:[0,6,16,21,24,25,26,27],emoji_:27,emoji_count:5,emoji_df:[5,24],emoji_entri:5,emoji_flat:5,emoji_flat_text:5,emoji_freq:5,emoji_per_post:5,emoji_raw:5,emoji_search:[5,24,27],emoji_summari:5,emoji_text:5,emot:5,empti:[2,4,5,6,20,21,24],en:[4,7,8,15,16,18,20,23],en_u:23,enabl:[8,14],encod:[7,16,18,19,20],encount:[10,20],encourag:18,end:[2,6,7,
14,16,20,22,24,27],engag:18,engin:[0,7,8,9,10,13,15,24,25,26,27],english:[14,17,20,21,24],enhanc:20,enough:[2,9,14,21,23],ensur:[2,16],enter:[14,16],entertain:23,entir:[14,18],entire_words_onli:6,entiti:[0,8,13,15,18,24,25,26,27],entri:5,env:10,environ:18,episod:[14,23],equal:[10,18,20],equival:[12,16],errback:7,errno:[10,12],error:[1,4,10,12,14,16,23,24],errors_fil:10,es:[8,20],escap:[14,23],espada:1,especi:[2,4,9,13,15,21],essenti:[21,22,27],estonian:14,etag:[13,15,24],etaospid:13,etc:[4,5,6,8,9,10,11,14,15,16,17,20,21,22,24,27],eur:6,euro:6,european:27,evalu:8,even:[10,13,14,15,16,18,21,23,24],event:[10,14,15,20,23],eventtyp:[14,23],ever:[14,21],everi:[10,13,15,16,18,21,23,27],everyon:21,everyth:[8,18,21],everywher:21,exact:[4,9,18],exactli:[2,5,23],exactterm:14,exampl:[2,4,6,7,8,9,10,13,14,15,16,18,20,21,22,23,24,27],example_crawl_1:4,excalam:6,exce:[1,2],except:[4,18,20,21],exclam:[6,22],exclamation_mark:6,exclamation_mark_count:6,exclamation_mark_freq:6,exclamation_mark_nam:6,exclamation_marks_flat:6,exclamation_marks_per_post:6,exclamation_summari:6,exclamation_text:6,exclud:[9,14,16,18,20,23,24,27],exclude_repli:18,exclude_url_param:[16,24],exclude_url_regex:[16,24],excludeterm:14,exclus:[14,23],exec:13,exist:[5,6,9,10,18],exit:10,exmapl:[4,7,16,27],expand:24,expect:[5,7,16],expens:7,experi:21,explain:[15,27],explan:16,explanatori:20,explicitli:[14,18,20],explod:15,explor:[5,6,15,16,17,18],exploratori:[4,16],explosionai:17,exposur:15,express:[0,3,5,6,9,10,13,14,16,21,24,25,26,27],ext_alt_text:18,extend:[10,18],extens:[4,10,13,14,24],extern:[7,10],extra:[2,10,21],extra_info:21,extract:[0,3,10,13,20,24,25,26,27],extract_:[6,24,27],extract_curr:[6,24],extract_emoji:[5,6,24],extract_exclam:[6,24],extract_hashtag:[6,24],extract_intense_word:[6,24],extract_ment:[6,24],extract_numb:[6,24],extract_quest:[6,24],extract_url:[6,24],extract_word:[6,24],extrem:[4,7,9,16,27],ey:13,f53301c8286f9bf59ef297f0232dcfc1:15,f:10,face:[5,14],facebook:[0,13,19,21,24,25,26],facebook
bot:10,facebookexternalhit:13,failur:7,fairli:20,fall:[8,14,18,23],fallback:1,fals:[1,2,4,6,9,10,13,15,16,18,20,21,24],famili:[10,18],familiar:15,fashion:23,fast:[7,12,24],faster:[15,24],fastest:15,fatal:15,favorit:[1,18,21],fb_robot:13,fb_test:13,fb_userag:13,fe546b9b:15,featur:[2,14,15,18,23,24,27],feb:[7,10],februari:[15,23],feed:[0,23,24,25,26],feel:[5,6,24],fetch:[13,16,24],few:[4,6,7,10,15,16,20,21,27],fewer:2,field:[10,14,23,24],fifteen:[9,21],fifti:21,figur:[13,16,18,27],file:[0,1,4,7,12,14,15,16,24,25,26,27],filedetail:23,filepath:16,filetyp:14,fill:14,filter:[10,14,15,18,20,23,24],filter_to_owned_list:18,find:[4,5,6,14,16,18,20,21,23,27],fine:16,finger:5,finish:4,finnish:[14,17,24],first:[2,4,6,8,13,14,15,16,18,20,21,22,23,24],fish:[14,23],fit:[2,23,24],five:[2,13,16,20,21],fix:[10,16,24],fl_progress:15,flag:5,flat:[5,6],flex:13,flexibl:16,flight:[14,18],fligt:14,float64:15,focu:[9,12,27],focus:14,folder:4,follow:[0,2,3,5,7,10,14,15,17,18,20,21,23,24,25,26,27],follow_link:[4,7,10,16,24],food:[5,23],footbal:[5,9,15,23,27],footer:[4,16,24],footer_links_href:4,footer_links_text:[4,16],footer_links_url:16,footnot:17,forc:18,forchannelid:23,forcontentown:[14,23],fordevelop:[14,23],form:[6,8,21],format:[0,1,2,7,9,11,13,14,16,18,23,24,25,26,27],former:21,formerli:21,formin:[14,23],forth:[14,18,23],forti:[21,27],forusernam:23,forward:7,found:[4,10,14,15,18],four:[5,13,14,16,20,21,23],fr:[8,14,16],fraction:16,frag_1:20,frag_2:20,fragment:[15,20],frame:9,franc:14,free:14,freebas:[14,23],freixo:1,french:[14,17,24],freq:15,frequenc:[0,5,6,12,24,25,27],frequent:21,fri:7,friend:18,from:[0,3,8,10,11,12,13,14,15,16,18,20,21,22,23,24,25,26,27],front:21,fruit:5,ft:[14,23],fucntion:6,full:[1,4,5,7,9,15,16,18,21,24,27],fulli:[5,6,18],func:18,funcion:8,further:[16,20,21],futur:[18,23],g:[1,7,14,16,19,23,24],g_face:15,gadget:2,gain:[15,25],galaxi:15,game:23,garda:12,gecko:10,gener:[0,6,10,13,16,19,20,21,23,24,25,26,27],genr:15,geocod:18,geograph:[14,23],geoloc:14,geometr:5,geor
gia:15,geotag:18,german:[14,17,24],gestur:5,get:[0,1,2,4,6,7,8,9,10,12,13,14,15,16,17,18,20,21,22,23,24,25,26,27],get_application_rate_limit_statu:18,get_available_trend:18,get_favorit:18,get_followers_id:18,get_followers_list:18,get_friends_id:18,get_friends_list:18,get_home_timelin:18,get_list_memb:18,get_list_membership:18,get_list_status:18,get_list_subscrib:18,get_list_subscript:18,get_mentions_timelin:18,get_place_trend:[18,24],get_retweet:18,get_retweeters_id:18,get_supported_languag:18,get_user_timelin:18,gideon:15,give:[4,7,9,12,14,16,18,20,21],given:[2,4,13,14,15,16,18,20,24],gl:14,global:[16,18,24],glove:5,gmail:8,gmbh:17,gmt:[7,16],go:[6,7,9,10,13,14,15,16,21,24],goe:[4,15],golf:23,good:[2,4,6,10,12,15,16,20],googl:[0,10,12,13,20,23,24,25,26,27],googlebot:[10,12,13],googletagmanag:4,googtwfb:13,got:16,gp:13,gr:10,grai:14,gram:[0,24,25,26],granular:16,graph:[0,16,24,25,26],graphic:9,grayscal:14,great:[1,16,20,27],greater:18,greek:[6,14,17,24],green:[6,14,21],grin:5,group:[2,5,6,9,13,24,27],groupbi:13,gtm:4,gtm_noscript:4,gtm_script:4,guarante:18,guid:[5,23],guide_categories_list:[23,24],guidecategori:23,guitar:9,gunicorn:7,gwnlj8m99yumucgdd6ytm:7,gx12:2,gz:[15,24],gzip:[7,16],h1:[4,16],h2:[4,16,24],h3:[4,7,16],h4:4,h5:4,h6:[4,16],h:[10,24],h_180:15,ha:[2,4,6,9,13,15,16,18,20,21,23,24,27],haaatttteee:6,had:[4,5,6,21],haiku:18,half:21,han:[14,23],hand:[5,8,9],handl:[4,10,12,13,14,18,24,27],handler:10,hant:[14,23],happen:[4,10,20],happi:[10,18],hard:[0,3,25],hash:20,hashtag:[6,11,13,18,21,24,27],hashtag_count:6,hashtag_freq:6,hashtag_raw:11,hashtag_summari:6,hashtags_flat:6,hashtags_per_post:6,hate:18,hauptstadt:8,have:[1,2,4,5,6,7,8,9,10,12,13,14,15,16,18,20,21,22,23,24,27],hd:[14,23],he:[15,21],head:[5,7,9,10,13,15,16,24,25,27],header:[0,4,13,15,16,24,25,26,27],header_links_href:4,header_links_text:[4,16],header_links_url:16,headers_df:7,headers_spid:7,headersspid:7,headlin:27,health:[2,23],heart:5,hebrew:[14,17,24],height:[16,23,24],heldforreview:23,hello
:[5,6,13,16],help:[4,6,7,10,12,14,15,16,18,20,22,24,27],helper:[5,22],henc:21,her:21,here:[2,5,6,7,9,10,14,15,16,20,21,27],hereaft:21,herebi:21,herein:21,hereupon:21,herself:21,heru80fdn:15,hi:[6,15,21],hidden:21,hierarchi:8,high:[4,8,14,15,16,23],higher:[8,14,15,23,24],highest:[14,23],highli:[14,16,23,27],highrang:14,hilari:18,him:21,himself:[15,21],hindi:[15,17,24],hip:23,hit:[0,3,7,16,25],hl:[14,23],ho:8,hobbi:23,hockei:23,hodgeman:15,hol:10,hola:6,home:[13,23],home_timelin:18,honnib:17,hood:7,hop:23,hope:27,hopefulli:27,hopewel:15,host:[10,12,14,24,27],host_df:[10,12],hostnam:[10,12,20],hot:5,hotel:[1,5,14],hour:[4,18],hous:15,how:[0,2,3,5,6,7,9,13,15,16,18,21,24,25,26,27],howev:[10,14,18,21,23],howsearchwork:13,hp:13,hq:14,href:[4,16,24],hreflang:[4,7,24],ht:16,hte:15,htm:10,html:[4,7,10,13,15,16,18,20,23,24],http:[4,5,6,7,8,10,13,15,16,18,20],httperror_allow_al:7,huge:14,hulu:15,humor:23,hundr:[7,16,21],hungarian:[14,17,24],hurri:4,hydrat:18,hyphen:2,i18n_languages_list:23,i18n_regions_list:23,i18nlanguag:23,i18nregion:23,i:[0,3,5,6,7,13,14,16,20,21,25,27],ia_archiv:13,ibmo9hrztai:7,ic:23,iceland:14,icon:14,id:[4,7,8,14,16,18,23],idea:[4,6,9,16,21,27],ideal:[13,20,21,27],ident:18,identifi:[14,16,18,20,23],ifram:4,iframe_src:4,ignor:21,imag:[7,8,10,13,14,15,16,18,24],image_loc:15,img:[16,24],img_:16,img_alt:16,img_src:16,imgcolortyp:14,imgdominantcolor:14,imgr:13,imgsiz:14,imgtyp:14,immedi:[13,18],implement:24,importantli:[10,20,27],improv:[14,21,24],inc:8,includ:[0,3,6,9,10,13,14,15,16,18,20,22,23,24,25,27],include_card_uri:18,include_ent:18,include_ext_alt_text:18,include_rt:18,include_url_param:[16,24],include_url_regex:[16,24],include_user_ent:18,includesubdo:16,includesubdomain:7,inclus:[14,23],inconsist:20,inde:21,independ:23,indepent:16,index:[0,7,8,10,14,16,18,24,26,27],india:15,indic:[4,7,13,14,16,18,20,23,24],individu:[14,23],indonesian:[14,17,24],industri:[13,14,15,27],infer:6,influenti:18,info:[10,14,24],inform:[5,7,8,10,12,14,15,18,20,21,23,24,27],
inherit:8,initi:[4,8],input:[1,2],insensit:[5,24],insert:[1,20],insid:22,insight:[0,4,15,21,24,25,26,27],instagram:18,instal:25,instanc:[6,8],instant:[0,24,25,26],instead:[13,16,18,20,21,23,24],instruct:[13,14,23],int64:[10,13,15],intact:2,integ:[2,14,23],integr:9,intend:[14,18,23],intens:[6,24],intent:[9,27],interact:[15,18],interest:[6,7,8,9,10,13,15,16,21,25],interfac:[7,14,18],interior:18,intern:[7,14,15,16,18],internacion:15,internation:14,internet:15,interv:[4,27],interview:15,introductori:27,invalid:24,invert:6,inverview:15,investig:4,invideopromot:23,io:[7,16,18],iowa:15,ip:[10,12,14,16,24,27],ip_address:[10,12,16],ip_host_dict:10,ip_list:12,ipaddrlist:[10,12],ir88:15,ir:12,iran:15,iraq:15,irish:[17,24],ismap:[16,24],iso:[8,14,18,23],issu:[4,24,27],italian:[14,17,24],item:[4,9,14,16,18,20,23,24],item_a:16,item_b:16,iter:2,its:[0,1,3,5,7,8,9,10,15,16,18,20,21,23,25],itself:[10,16,20,21],iyl50:7,ja:18,janeiro:9,japanes:[14,17,24],java:10,javascript:4,jazz:23,jenni:6,ji:8,jin:8,jl:[4,7,10,13,16,24],job:[0,3,9,25,27],jobdir:4,john:6,join:16,jpeg:7,jpg:15,jpy:6,js:[4,10],js_script_src:4,js_script_text:4,json:[7,10,14,16,18,24],json_norm:[10,24],jsonld_1_:16,jsonld_:16,jsonld_error:24,jsonlin:[7,16],julian:15,jung:8,jungl:8,just:[2,5,10,14,16,18,21,27],k:[10,16,21],ka:15,kaggl:[5,27],kang:8,kansa:15,kazakh:[17,24],keep:[1,4,5,8,9,12,13,16,18,21,24,27],kei:[4,5,6,8,14,16,17,18,20,21,23,24],key_nam:6,keyword:[0,5,8,16,17,21,24,25,26,27],keywords_df:9,khtml:10,kill:4,kilomet:[14,18,23],kind:[7,16,24,27],kiwi:21,km:[14,18,23],know:[2,9,10,16,20,27],knowledg:[0,23,24,25,26],knowledge_graph:[8,24],known:[7,16,18,21,24,27],korea:8,korean:[8,14],kw_:[16,24,27],kw_broad:9,kw_df:9,kw_exact:9,kw_gener:[9,16,24,27],kw_modifi:9,kw_neg_broad:9,kw_neg_exact:9,kw_neg_phras:9,kw_phrase:9,kwarg:[6,7],l1:16,lab:15,label:9,lamborghini:1,land:[2,9,27],lang:[13,18],lang_:14,lang_ar:14,lang_bg:14,lang_c:14,lang_ca:14,lang_d:14,lang_da:14,lang_el:14,lang_en:14,lang_et:14,lang_fi:14,lang_
fr:14,lang_hr:14,lang_hu:14,lang_i:14,lang_id:14,lang_it:14,lang_iw:14,lang_ja:14,lang_ko:14,lang_lt:14,lang_lv:14,lang_nl:14,lang_no:14,lang_pl:14,lang_pt:14,lang_ro:14,lang_ru:14,lang_sk:14,lang_sl:14,lang_sr:14,lang_sv:14,lang_tr:14,lang_zh:14,languag:[0,7,8,9,14,15,16,18,20,21,23,24,25,26,27],larg:[0,4,5,10,12,14,15,16,21,24,25,26,27],larger:[14,18,23],last:[1,2,6,13,15,16,20,21,24],last_dir:[15,20,24],lastmod:15,lat:18,latenc:7,later:[0,3,10,15,25],latest:[1,2,16,18],latin:23,latitud:[14,18,23],latter:21,latterli:21,latvian:14,layout:[10,23],ld:[7,16,24],lead:14,leaf:5,learn:[9,15,16,21,23],leas:16,least:[14,21,23],leav:[2,13],left:[4,6,23],left_char:6,len:2,lenght:24,length:[1,2,7,15,18,20,21,22],less:[14,16,18,21,23],let:[1,2,8,9,13,14,15,16,21,23],letter:[2,5,14,23],level:[4,10,14,16,18,20,23],level_or_nam:14,li:[16,24],licens:[8,14,23],life:25,lifestyl:23,light:[5,7],like:[5,6,7,8,9,10,12,14,15,16,18,21,23,24,27],likelyspam:23,limit:[1,2,8,13,14,16,18,23,27],line:[1,7,8,10,12,13,14,16,25],lineart:14,link:[0,3,6,7,14,15,18,20,23,24,25,26,27],link_rel_href:4,link_rel_rel:4,link_rel_stylesheet:4,linkedin:13,linkedinbot:[10,13],links_frag:24,links_href:16,links_nofollow:[16,24],links_text:[16,24],links_url:[16,24],linksit:14,linux:[10,24],lisbon:1,list:[0,1,2,3,5,7,8,9,10,12,13,14,15,17,18,20,21,22,23,24,25,26,27],list_id:18,liter:8,lithuanian:14,littl:[20,25,27],live:[14,23],livestreamingdetail:23,ll:[13,18,21],load:[10,16,24],loc:15,local:[14,18,23],locat:[14,15,18,20,23,27],locationradiu:[14,23],log:[0,3,12,14,15,16,23,26,27],log_error:10,log_field:10,log_fil:[4,10,16],log_format:10,logic:14,login:[10,13],logs_df:10,logs_file_path:10,logs_to_df:[0,24,25,26],lokal:8,lon:18,longdesc:[16,24],longer:[1,2,6,14,21,23,24],longitud:[14,18,23],look:[2,9,15,21],lookout:7,lookup:[0,10,18,24,25,26],lookup_statu:18,lookup_us:18,looooooovvvve:6,looooooveee:6,loop:[14,18,24],lose:13,lost:[2,4],lot:[2,7,10,15,20,27],love:[5,18,21],love_emoji:5,lower:16,lowest:[14,23],lowran
g:14,lr:14,luxuri:9,m:[10,13,14,15,23],ma:[7,16],machin:15,made:[6,12,18,21],mai:[10,13,14,16,18,21,23],mail:12,main:[2,8,13,14,15,16,18,20,21,24,27],mainli:[4,9,12,13,21,22],mainten:7,major:[10,13,15,18,27],make:[0,1,2,3,6,7,9,10,12,13,14,15,16,18,20,21,24,25,27],make_datafram:18,mammal:5,manag:[4,7,14,18,23,27],managedbym:23,mango:21,mani:[1,2,4,5,6,8,9,10,12,13,14,15,16,18,20,21,23,27],manipul:27,manner:[8,20],manual:4,map:[6,8,9,16,18,27],march:15,mark:[6,18,20,21,22,24],market:[0,8,9,14,16,19,24],martial:23,masscan:10,massiv:[10,12],master:[4,7,16],match:[5,6,8,9,10,14,16,18,23,24],match_typ:9,matter:9,matthew:17,max:[7,16],max_column:10,max_id:18,max_len:[1,9],max_work:[12,15,24],maxheight:23,maxim:18,maximum:[1,2,8,9,12,14,15,16,18,23],maxresult:[14,23],maxwidth:23,mayb:[9,13],mb:24,mckinlei:15,mckinleyd:15,me:[21,22],mean:[6,7,8,9,10,13,14,16,18,20,21,27],meaning:[15,21],meanwhil:21,measur:[4,14,23,24],media:[5,6,10,16,17,18,20,21],medium:[5,14,19,23],meet:[14,23],mega:15,megabyt:27,member:18,membership:18,memori:[10,16],mention:[6,8,11,18,20,21,27],mention_count:6,mention_freq:6,mention_raw:11,mention_summari:6,mentions_flat:6,mentions_per_post:6,mentions_timelin:18,merced:1,merg:[14,16,18,24],messag:[10,24],meta:[4,7,14,16,18,20],meta_desc:[4,16],metadata:[14,18,23,24],metatag:7,method:[7,10,14,16,18,23,25,27],method_from:10,method_to:10,metric:21,mi:[14,18,23],middl:24,middleeast:15,middlewar:10,might:[2,4,5,6,7,9,10,13,14,15,16,20,21,23,25,27],mile:18,militari:23,miller:15,million:21,min:10,min_rep:6,mind:[4,5,8,16,18,27],mine:[17,21,22,23,27],mini:7,minnesota:15,minor:[10,24],minu:16,minut:[14,15,23],miss:[2,15,24],missouri:15,mistak:13,mix:[18,20,23],mj12bot:10,mm:[15,18,23],mmb29p:10,mobil:10,mode:[0,3,6,18,24,25,26],model:[2,10,15],model_a:16,model_b:16,moder:[14,23],moderationstatu:23,modifi:[5,6,7,9,13,15,16,17,18,21],modul:[1,16,21,24,25,26,27],monitor:27,mono:14,month:[14,15,18],more:[2,4,5,6,7,8,9,10,13,14,15,16,18,20,21,23,24,27],moreov:21,morn
:6,most:[1,2,4,6,7,9,10,14,15,16,18,21,23,27],mostli:[4,16,20,21,27],mostpopular:23,motorsport:23,move:21,movi:[14,15,18,23],mozilla:[10,16],mp4:15,mpu:19,ms:[10,16],msg:24,msnbot:13,much:[15,16,21,24],multi:[12,14],multimedia:15,multin:8,multipl:[0,3,6,8,13,14,15,16,24,25,27],multipli:21,mundo:15,music:23,must:[10,14,18,21,23],my:[0,1,3,16,21,25],my_output_fil:16,myrat:23,myrecentsubscrib:23,myself:21,mysit:19,mystuff:13,mysubscrib:23,n:[0,24,25,26],na:[20,24],name:[1,4,5,6,7,8,9,10,12,13,14,15,16,18,19,20,21,23,24,27],name_1:16,name_2:16,nan:[7,8,10,15,16,20],narrow:23,nasa:18,nat:[13,15],natali:15,nativ:18,native_video:18,natur:5,nav:[4,16,24],nav_links_href:4,nav_links_text:[4,16],nav_links_url:16,naverbot:13,navig:18,ncov:15,nebraska:15,need:[1,2,4,6,7,8,9,10,12,13,14,16,18,21,27],neg:[6,9,18],neither:21,nepali:[17,24],nest:[18,23],net:[10,15],netloc:[15,20],network:[6,20],never:21,nevertheless:21,newest:[15,23],news_keyword:15,news_publ:15,news_publication_d:15,news_titl:15,next:[9,16,21,23,27],next_cursor:18,nextpagetoken:[14,23,24],nexu:10,nfl:15,nginx:[7,16],nginx_error:10,nh:15,nine:21,nl:10,nobodi:21,node:18,nofllow:16,nofollow:[16,24],noindex:7,non:[10,14,21,22,23,24,27],none:[2,5,6,7,8,10,13,14,16,18,19,21,23],noon:21,nor:21,normal:[10,17],norwegian:[14,17,24],nose:15,note:[2,6,8,14,16,18,20,21,23,27],notebook:27,noth:[6,21],notic:[6,13],noticia:15,notset:14,noun:9,now:[1,2,6,9,10,13,15,16,18,21,24],nowher:21,np:15,ns:[4,15],nt:[10,16],num:14,num_currency_symbol:6,num_emoji:5,num_exclamation_mark:6,num_hashtag:6,num_list:[21,24],num_ment:6,num_numb:6,num_post:[5,6],num_question_mark:6,num_url:6,num_word:6,number:[0,3,5,6,8,9,12,13,14,15,16,18,20,21,23,24,25,27],number_count:6,number_freq:6,number_of_emoji:5,number_of_hashtag:6,number_of_ment:6,number_of_numb:6,number_of_symbol:6,number_of_url:6,number_of_word:6,number_separ:6,number_summari:6,numbers_flat:6,numbers_per_post:6,numer:[18,23],nutch:10,nyt:15,nyt_new:15,nytim:15,nz:14,o:11,oauth_token:18,oa
uth_token_secret:18,oauth_vers:18,obama:15,obei:[0,3,10,25],obido:13,object:[5,6,8,10,15,16,18,23,27],obtain:[18,21],occur:[6,15,16,18,21,23,24],occurr:[6,21],odai:6,off:[4,14,21],offer:[9,18],often:21,og:[4,16,24],og_cont:4,og_prop:4,ohio:15,ok:7,older:18,oldest:18,omit:18,onbehalfofcontentown:[14,23],onbehalfofcontentownerchannel:23,onc:[2,4,8,9,10,14,15,16,18,20,21,23,25,27],one:[1,2,4,5,6,8,9,10,11,13,14,15,16,18,20,21,23,24,27],ones:[5,6,7,10,12,15,16,21],ongo:[14,23],onli:[0,1,3,6,7,10,11,13,14,15,16,18,19,21,23,24,25,27],onlin:[2,16],onto:21,open:[10,13,15,16,24],opengraph:[4,7],oper:[10,14,15,18,23,24],oppos:[9,20,24],opposit:6,opt:18,optim:[7,8],option:[2,4,6,7,9,10,13,14,16,17,18,20,21,22,23,24,27],orang:[14,21],order:[6,8,9,14,16,23],order_matt:9,org:[5,7,8],organ:8,origin:[4,10,14,16,20,24],orterm:14,other:[2,5,6,7,8,10,11,13,14,15,16,18,20,21,23,24,27],otherwis:[16,18,20,21],ottawa:15,ound:6,our:[2,10,18,21],ourselv:[10,21],out:[1,8,10,13,14,16,18,20,21,23,27],outpuf_fil:16,output:[7,10,16,18,24],output_fil:[4,7,10,13,16,24],outreach:27,outsid:[10,14,23],over:[4,7,15,16,18,21,24],overview:[2,5,6,12,15,27],overwrit:16,owen:15,own:[6,9,10,14,18,20,21,23,27],owner:[13,14,18,23],owner_id:18,owner_screen_nam:18,ownership:18,p:[16,24],packag:[16,17,24,25,26,27],page:[0,2,3,6,7,8,9,10,13,15,17,18,20,21,23,24,25,26,27],page_1:4,page_2:4,page_3:4,page_4:4,pagelet:13,pagemap:24,pagepostssectionpagelet:13,pagetoken:[14,23],pageview:[10,21],pagin:[24,27],pai:14,pair:18,pakistan:15,pam:15,pand:24,panda:[5,7,9,10,13,15,16,18,24],panel:14,paper:5,param:27,paramet:[0,1,2,4,5,6,7,8,9,10,12,13,14,15,18,19,21,22,23,24,25,26,27],parent:[4,23],parenthes:22,parentid:23,parmet:16,parquet:[10,24],pars:[0,7,16,24,25,26,27],parser:27,part:[6,9,12,14,17,20,21,22,23,27],parti:18,partial:5,particular:[13,14,15,23],particularli:[14,16],partner:[14,23],pass:[4,8,13,14,15,16,18,27],past:[14,27],patch:10,patch_minor:10,path:[0,4,7,10,13,15,16,24,25,26],path_1:20,path_2:20,path_3:20,pat
ienc:13,pattern:[0,6,13,15,20,21,25],paus:[0,3,25],pd:[7,10,13,15,16],peopl:[5,6,8,18,21,27],per:[5,6,14,15,18,21,27],perc:[10,12],percentag:[12,21,24],perform:[10,12,14,15,16,23],perhap:21,period:7,periscop:18,permiss:13,permut:9,persian:[15,17,24],person:[8,14],perspect:[16,20,21],pet:23,petalbot:10,phone:6,photo:[14,18],php:13,phrase:[9,14,18,21,22,24],phrase_len:[21,22,24],physic:23,pic:18,pictur:[15,21],piec:7,pink:14,pinterest:13,pinterestbot:13,pip3:[25,27],pip:[25,27],pipe:[14,21,23],pipelin:12,place:[1,4,5,8,18,24],placehold:[24,27],plai:[5,8,14,15,23],plain:23,plaintext:23,plan:10,plant:5,platform:[2,21,27],playback:[14,23],player:23,playlist:[14,23,24],playlist_items_list:23,playlistid:23,playlistitem:23,playlists_list:23,pleas:[7,8,14,16,18,21,23],png:[7,15,16],podcast:15,point:[5,8,14,20,23],pointer:12,polici:7,polish:[14,17,24],polit:[4,18,23],pop:23,popul:20,popular:[10,18,23,27],port:20,porto:1,portug:1,portugues:[14,15,17,24],posicionamiento:8,posit:[6,8,14,18,23],possibl:[9,10,13,14,21,27],post:[5,6,17,18,20,21,25,27],posts2:6,potato:5,potent:13,potenti:[16,18],potteri:15,pound:6,povertydata:7,power:[6,7,16],ppc:21,ppp046177196171:10,ppp089047044105:10,practic:[4,10,12,16,27],pre:[0,10,21,24,25,26],preced:24,prefer:18,preferenti:18,prefix:[8,24],preload:7,premier:15,prepar:[0,5,15,24,25,26],prepend:[18,20],present:[14,18,24],presidenti:15,pressur:16,pretti:16,prevent:[18,24],previou:[20,23,24],previous_cursor:18,prevpagetoken:[14,23],prg:7,price:[9,16,20],print:[5,10,15,17,24],prioriti:15,probabl:[4,16,27],process:[4,7,10,12,15],processingdetail:23,produc:[1,10,14,15,27],product1:20,product2:16,product:[0,1,2,8,9,14,16,20,21,24],profession:23,profil:[13,18],program:18,programmat:14,prohibit:13,project:[7,8,14,16,23,27],promis:27,promo:15,promot:15,proper:27,properli:[9,10,14,15,20,23,24],properti:[4,14,16,23],protocol:7,prouc:14,provid:[1,2,4,6,9,10,12,13,14,15,16,18,20,21,23,24,27],proxi:12,proxito:[7,16],publication_languag:15,publication_nam:15,
publish:[15,23],publishedaft:[14,23],publishedbefor:[14,23],punctuat:24,puppi:18,purchas:9,purpl:14,purpos:13,put:[9,10,15,16,21],puzzl:23,pypi:24,pyt:16,pyth:16,python:[0,5,17,18,24,25,26,27],python_tweet:18,q:[7,14,18,23],q_80:15,qualifi:5,qualiti:[7,14],quantifi:21,queri:[0,8,10,13,14,15,18,23,24,25,26,27],query_:20,query_color:20,query_pric:20,query_s:20,query_tim:[8,24],querytim:[14,24],question:[2,6,15,18,21,22,24,27],question_mark:6,question_mark_count:6,question_mark_freq:6,question_mark_nam:6,question_marks_flat:6,question_marks_per_post:6,question_summari:6,question_text:6,questionnair:14,quick:[2,13,15],quickli:4,quit:[13,15,21],quot:22,quota:23,quotat:21,ra:15,race:[15,23],radio:15,radiu:18,rai:[7,16],rain:[6,21],rais:[16,24],ran:16,randolph:15,random:13,rang:[14,18],rank:[8,16,24,27],rapid:10,rate:[14,15,16,18,21,23],rate_limit_statu:18,rather:21,raw:11,rc2:7,re:[18,21],reachabl:16,read:[6,10,20],read_json:[7,13,16],read_parquet:10,readabl:[11,13,16,27],reader:10,readi:[9,18],readm:16,readthedoc:[7,16,18],real:18,realiti:13,realli:[7,9,10,16,21],reason:[4,7,10,13,16,24],receiv:[13,18],recent:[1,18,23],recip:[0,3,16,24,25],recommend:[6,10,16,18],recordingdetail:23,recurs:[7,15,16,24],red:[14,20],redirect:[10,16,24,27],redirect_from:10,redirect_reason:[7,16],redirect_tim:[7,16],redirect_to:10,redirect_ttl:[7,16],redirect_url:[7,16],refer:[7,8,10,14,16,18,20],referer_:10,referer_url_df:10,referr:[7,19],referrerpolici:[16,24],reflect:24,regard:[16,21],regardless:[14,23],regex:[0,5,6,10,11,21,24,25,27],regex_raw:11,regga:23,region:[16,18,23],regioncod:[14,23],regular:[0,5,6,10,16,21,24,25,26],reilli:11,reinvent:15,rel:[4,8,12,13,16,20,24,27],rel_valu:[21,24],relat:[6,9,14,15,16,23,27],relatedsit:14,relatedtovideoid:[14,23],relayout:24,releas:24,relev:[9,14,18,19,23],relevancelanguag:[14,23],reli:16,reliabl:8,religion:23,remain:[2,15,22],remaind:[2,24],remark:16,rememb:16,remov:[14,16,18,21,22,23,24],renam:20,render:27,repeat:[6,20,24],repetit:6,replac:[1,10,
15,20,24,27],repli:[18,23],repons:[24,27],report:[7,12,16,20,21,24,27],repres:[8,10,14,15,18],represent:18,request:[0,3,7,8,10,12,14,16,18,23,24,25,27],request_:10,request_dir_10:10,request_dir_11:10,request_dir_12:10,request_dir_13:10,request_dir_1:10,request_dir_2:10,request_dir_3:10,request_dir_4:10,request_dir_5:10,request_dir_6:10,request_dir_7:10,request_dir_8:10,request_dir_9:10,request_frag:10,request_headers_:16,request_headers_accept:[7,16],request_headers_cooki:16,request_headers_us:[7,16],request_hostnam:10,request_last_dir:10,request_netloc:10,request_path:10,request_port:10,request_queri:10,request_query_:10,request_query__:10,request_query_a:10,request_query_aam:10,request_query_abspath:10,request_query_act:10,request_query_adapt:10,request_query_ag:10,request_query_albid:10,request_query_cmd:10,request_query_cod:10,request_query_cont:10,request_query_control:10,request_query_cpabc_calendar_upd:10,request_query_curpath:10,request_query_currentset:10,request_query_dir:10,request_query_dn:10,request_query_email:10,request_query_fil:10,request_query_file_link:10,request_query_filenam:10,request_query_filepath:10,request_query_findcli:10,request_query_fn:10,request_query_folderid:10,request_query_format:10,request_query_funct:10,request_query_gid:10,request_query_id:10,request_query_img:10,request_query_index:10,request_query_input_fil:10,request_query_item:10,request_query_itemid:10,request_query_lang:10,request_query_libpath:10,request_query_mod:10,request_query_mypath:10,request_query_nam:10,request_query_next_fil:10,request_query_nocontinu:10,request_query_op:10,request_query_opt:10,request_query_ord:10,request_query_p:10,request_query_pag:10,request_query_panel:10,request_query_path:10,request_query_posit:10,request_query_psd:10,request_query_q:10,request_query_redirect:10,request_query_ref:10,request_query_rid:10,request_query_sb_categori:10,request_query_scopenam:10,request_query_search_kei:10,request_query_servic:10,request_query_short:10,request_
query_sit:10,request_query_srt:10,request_query_step:10,request_query_stockcodeintern:10,request_query_target:10,request_query_term:10,request_query_thumb:10,request_query_titl:10,request_query_todo:10,request_query_typ:10,request_query_typeid:10,request_query_url:10,request_query_usernam:10,request_query_v:10,request_query_var:10,request_query_wt:10,request_query_xdebug_session_start:10,request_schem:10,request_url:10,request_url_df:10,requir:[10,14,15,16,18,19,23],rerun:4,resampl:15,research:[9,13,27],resolut:[14,23],resourc:[10,14,16,18,23,27],resourceid:23,resp_headers_:16,resp_headers_access:16,resp_headers_ag:[7,16],resp_headers_alt:7,resp_headers_cach:[7,16],resp_headers_cf:[7,16],resp_headers_cont:[7,16],resp_headers_d:[7,16],resp_headers_etag:7,resp_headers_expect:[7,16],resp_headers_expir:[7,16],resp_headers_last:[7,16],resp_headers_permiss:7,resp_headers_referr:7,resp_headers_serv:[7,16],resp_headers_strict:[7,16],resp_headers_vari:[7,16],resp_headers_via:7,resp_headers_x:[7,16],resp_meta_:24,respect:[2,4,10,16,18,21,24],respons:[0,8,10,13,14,15,16,18,23,24,25,26,27],rest:[6,8,13],restaur:6,restrict:[2,8,14,16,18,23,24],result:[0,1,4,5,10,13,15,16,18,20,21,23,24,25,26,27],result_typ:18,resultscor:8,resum:[0,3,25,27],retain:[9,20],retreiv:[4,15,24],retriev:[14,15,18,23],returnd:24,retweet:[18,21],retweeted_of_m:18,retweets_of_m:18,reus:[14,23],reveal:15,revenu:21,revers:[0,10,14,18,23,24,25,26],reverse_dns_lookup:[10,12,24,27],review:[10,14,15,23],rewrit:24,rfc:[14,23],rhythm:23,rich:[15,18],richer:16,right:[9,10,14,15,20],right_char:6,rio:9,risk:15,rm_word:21,rn:15,rnkt7myjj7hcnsvbnzg9qdqizefftx9ytz3:7,robot:[0,3,10,15,16,24,25,26,27],robots_output_fil:13,robots_url:13,robotsfiles_df:13,robotstxt:24,robotstxt_df:13,robotstxt_last_modifi:[13,24],robotstxt_obei:[4,7],robotstxt_test:[13,24],robotstxt_test_df:13,robotstxt_to_df:[13,24],robotstxt_url:13,robotx:13,rock:23,rogen:15,role:[20,23],rolling_new:15,romanian:[14,17,24],root:18,row:[9,10,13,14,15,21],rt
d:[7,16],rtl:6,rule:[0,3,7,10,13,16,20,25,27],run:[0,4,5,8,9,12,13,14,15,16,18,20,21,24,25,26,27],russia:15,russian:[14,15,17,24],s22:15,s:[0,1,2,4,6,7,9,10,13,14,15,16,18,20,21,23,24,25,26,27],safari:10,safe:[14,18],safesearch:[14,23],safeti:14,safetycheck:13,sai:[9,14,16,21,27],said:[6,13],sail:[14,23],sale:21,same:[0,1,2,3,5,6,8,9,10,13,14,15,16,18,20,21,23,24,25,27],sampl:[5,8,15,16],sample_log:10,samsung:15,sara:15,satisfi:10,save:[0,3,7,10,13,16,24,25,27],scale:[0,12,24,25,26],scari:18,scenario:2,schauspielerin:8,schema:8,scheme:[15,20],scienc:[15,27],scientist:27,score:[8,21],scrape:[0,3,10,16,24,25],scraper:10,scrapi:[7,16,27],screen:18,screen_nam:18,script:[4,7],script_src:4,sd:[14,23],seahawk:15,search:[0,7,8,13,15,18,19,20,23,24,25,26,27],search_us:18,searchterm:23,searchtyp:14,seattl:15,sec:16,second:[2,4,6,8,9,14,16,20,24,27],section:[13,14,23],secur:[7,16],see:[2,4,5,6,8,12,13,14,15,16,18,20,21,22,23],seem:[15,16,21],seen:10,segment:[9,18],selecotr:16,select:[10,14,16,18,23],selector:[0,24,25,26,27],selector_1:16,selector_2:16,self:20,sell:[9,15],sem:[0,16,24,26],sem_campaign:9,semi:18,semrush:27,senat:15,senatewinn:15,send:[8,10,18,27],sendfil:[7,16],sens:[20,21],sensit:[4,9,18],sent:[14,18,23],sentenc:[6,21],seo:[0,3,8,9,13,15,21,24,26],seop:8,seoul:8,sep:[2,24],separ:[2,6,10,14,16,18,20,23,24],sequenc:21,serbian:14,seri:15,seriou:21,serp:[0,8,20,24,25,26,27],serp_:[14,27],serp_goog:[14,16,24,27],serp_youtub:[14,24],serv:[7,16],server:[0,3,7,10,12,14,16,23,25],servic:[5,8,9,14,15],session:[10,14,18],set:[0,2,3,7,8,9,10,14,15,18,20,21,22,23,24,25,26,27],set_auth_param:18,set_index:15,set_logging_level:14,seth:15,setup:[0,24,25,26],sever:[0,4,7,10,14,18,21,23,24,25,26,27],seznambot:13,shape:[10,15],share:[11,16,21],shatel:12,she:21,sheet:[24,27],shift:9,shoe:[16,21],shop:[2,16],shorter:[2,23,24],should:[1,4,6,7,8,13,14,16,18,21,23],shouldn:[9,10],show:[5,6,8,9,10,14,16,20,21,23,24],show_list:18,show_owned_list:18,shown:[8,20],si:15,side:[10,21,22],side
bar:[16,24],sidebar_link:16,sidebar_links_url:16,sign:[6,13,16,20,22],signatur:18,signifi:9,similar:[1,6,16,20,23,24],similarli:[14,16,23],simpl:[4,5,6,7,12,15,16,18,21,27],simpler:24,simplest:[16,20],simpli:[4,9,10,12,13,15,16,21],simplifi:[7,14,23],simul:23,simultan:16,sinc:[1,2,6,7,15,16,18,21],since_id:18,sine:7,singapor:1,singl:[10,13,14,16,18],singular:6,sinhala:[17,24],site:[4,9,13,14,15,16,20,21,23,24,27],site_crawl:16,site_scraping_tos_term:13,sitemap:[0,13,16,20,24,25,26,27],sitemap_df:15,sitemap_download:24,sitemap_last_modifi:[15,24],sitemap_size_mb:[15,24],sitemap_to_df:[15,16,24],sitemap_url:15,sitemapindex:24,sitename_crawl_yyyy_mm_dd:16,sitesearch:14,sitesearchfilt:14,sitmeapindex:15,situat:20,sivasubramanian:15,six:[2,21],sixti:21,size:[7,10,13,14,15,16,18,20,24],skateboard:15,skin:5,skip:[16,24],skip_statu:18,skip_url_param:24,slectorgadget:16,slice:18,slight:24,slot:[1,2,24,27],slovak:14,slovenia:5,slovenian:14,slow:[0,3,25],slug:[15,18,20],slurp:13,sm:20,small:[5,13,14,23],smaller:[15,23,24],smartphon:[10,15],smile:5,smilei:5,snippet:[14,16,23,24],snow:[6,21],so:[0,2,3,6,7,8,9,10,13,14,15,16,18,20,21,23,25,27],social:[5,6,16,17,20,21],societi:23,softwareappl:8,solut:4,some:[4,5,6,7,10,12,13,14,15,16,18,20,21,23,24,27],somehow:21,someon:21,someth:[1,2,21],sometim:[2,4,9,13,16,21,27],somewher:[21,27],soon:13,sophist:27,sort:[14,17,20,21,23,24],soul:23,sourc:[1,2,5,6,7,8,9,10,12,13,14,15,16,18,19,20,21,22,23],source_fil:10,south:8,space:[2,14,15,18,22],spaci:[17,24],spam:23,span:[16,24],spanish:[6,14,17,24],speak:14,special:[6,15,16,20,24,27],specif:[7,14,18,23,27],specifi:[0,2,3,6,8,10,13,14,16,18,22,23,24,25,27],speed:[7,16,24],spend:[18,27],spent:27,spider:[0,4,7,10,24,25,26,27],split:[0,2,10,15,16,21,22,24,25,26,27],sport:[5,15,23],spread:27,squar:5,square_bann:19,src:[4,16,24],srcset:[16,24],ss:23,stage:10,standard:[14,16,18,20,23,27],star:[1,15],start:[2,4,6,7,9,10,14,15,16,18,21,23,24,27],start_request:7,starting_out:18,stat:[4,5,6,24],state:
[8,14,15,20,23],static01:15,statist:[5,6,12,23,24,27],statu:[0,5,10,16,18,23,24,25,26,27],status:18,stdout:10,stearn:15,step:[8,22],still:[2,14,15,18,21,23],stiller:15,stitch:27,stop:[0,3,16,21,24,25,27],stopword:[0,21,24,25,26,27],storag:[10,15],store:[10,16],str:[1,2,5,6,7,9,10,13,15,16,18,19,21],straight:7,straightforward:[6,16,20],strateg:[15,27],strategi:[0,3,7,9,13,15,16,23,25],stream:18,strict:[14,23],stricter:24,string:[1,2,5,6,8,9,11,14,18,19,22,23,24],stringify_id:18,strip:[18,21,22],strongli:[16,18],structur:[0,4,7,9,15,18,24,25,26,27],stuff:[2,27],style:[13,16,24],stylesheet:4,sub:[0,3,5,6,10,13,15,16,18,20,24,25,27],sub_group:5,subdomain:[7,16],submodul:[16,24,25,26],subpackag:[24,25,26],subscrib:[18,23],subscribersnippet:23,subscript:[18,23],subscription_order_relev:23,subscriptions_list:23,subsequ:[14,23],subset:15,substr:8,suchmaschinenmarket:8,suchmaschinenoptimierung:8,suggest:[4,20,23],suit:10,suitabl:8,sulli:8,summar:[5,6,10],summari:[5,6,24],summer_promo:19,superhero:18,suppli:[12,14,24],support:[0,7,13,14,16,18,23,24,25,26,27],suppos:[13,20],sure:[0,1,2,3,6,7,12,14,16,18,20,24,25],surround:[6,24],surrounding_text:6,survei:14,susan:15,suspend:18,svc:7,swami:15,swedish:[14,17,24],sy:10,symbol:[5,6,24],syndic:[14,23],system:[10,24],sytem:20,sz:23,t:[0,1,3,6,7,9,10,14,16,20,21,22,24,25,27],tabl:[8,9,16,27],tablet:15,tackl:27,tag:[4,7,13,14,15,16,23,24,27],tagalog:[17,24],tail:9,take:[2,4,6,8,9,10,13,15,16,18,20,21,24,27],talk:2,tamil:[17,24],target:[9,23],task:[7,9,21,22,27],tatar:[17,24],tc2:15,teach:15,teal:14,team:15,technic:[8,27],techniqu:[4,21,27],technolog:[8,23],tediou:[9,20],telegrambot:13,tell:16,telugu:[17,24],templat:[1,2,15],temporari:10,ten:[14,21],tenni:23,teoma:13,term:[14,16,19,23,27],test:[0,5,24,25,26],tester:[0,24,25,26],text:[0,1,4,7,10,16,17,18,22,23,24,26],text_ad:2,text_list2:21,text_list:[5,6,21,22],textformat:23,textual:[5,6],thai:[17,24],than:[1,2,13,14,16,18,21,23,24,27],thei:[4,6,10,12,13,14,15,16,18,20,21,22,23,24],the
m:[0,2,3,6,7,9,10,12,13,15,16,18,20,21,24,25,27],themselv:[21,24],thenc:21,thereaft:21,therebi:[21,23],therefor:[4,14,21,23],therein:21,thereupon:21,thi:[1,2,4,6,7,8,9,10,12,13,14,15,16,18,20,21,22,23,24,25,27],thing:[1,2,6,8,9,15,16,20,22,25,27],think:[16,20],third:[16,18,21],those:[0,2,3,7,8,9,10,12,13,14,15,16,20,21,23,24,25,27],though:[13,14,16,18,21,23],thought:8,thousand:[4,5,7,12,21,27],thread:[15,23,24],three:[1,4,6,15,16,18,20,21,24,27],through:[4,7,10,13,14,15,16,18,21,22,23,27],throughout:21,thru:21,thu:[7,16,21],ticket:14,time:[1,2,4,5,6,7,8,9,10,12,13,14,15,16,18,21,23,24,27],timecr:23,timelin:18,timeout:24,timestamp:10,tini:13,tip:7,titl:[4,6,9,14,16,20,21,23,24,27],tl:10,tld:[14,24],to_datetim:10,to_parquet:10,toctre:16,todai:[1,5,6],togeth:[5,6,10,13,18,20,21,27],token:[0,21,24,25,26],token_typ:18,tokyo:1,tolist:[13,15],tommi:15,tone:5,too:[0,3,16,21,25,27],took:16,tool:[0,7,10,14,15,16,20],top:[0,5,6,8,9,10,12,14,15,16,18,20,21,23,24,25,26,27],top_bot:10,top_currency_symbol:6,top_domain:6,top_emoji:5,top_emoji_categori:24,top_emoji_group:5,top_emoji_sub_categori:24,top_emoji_sub_group:5,top_emoji_text:5,top_exclamation_mark:6,top_hashtag:6,top_ment:6,top_numb:6,top_question_mark:6,top_tld:6,top_url:6,top_word:6,topic1:20,topic2:20,topic:[14,15,18,20,23,24],topic_1:20,topic_2:20,topicdetail:23,topicid:[14,23],tor:10,total:[2,10,13,21],tourism:23,toward:[18,21],town:24,toyota:[1,9],traceback:1,track:[23,24,27],tracker:15,tradit:[14,23],traffic:[16,18,19],trail:22,train:6,transport:[7,15,16],travel:5,trend:[18,21,27],tricki:16,trigger:4,trim:22,trim_us:18,trip:9,truestatus:18,truncat:16,turkc:15,turkish:[14,17,24,27],turn:14,tutor:9,tutori:[9,16,27],tv:[15,23],tw:14,tweet:[17,18,21,27],tweet_:18,tweet_mod:18,twelv:21,twenti:[9,13,21],twice:[0,3,21,24,25],twimg:18,twitter:[0,4,7,13,16,19,24,25,26,27],twitterbot:[10,13],two:[1,2,4,6,9,11,13,14,16,20,21,23,24,27],twtr_content:4,twtr_name:4,twython:[18,24],txt:[0,3,5,10,15,16,24,25,26,27],type:[4,6,7,8,9,1
0,14,16,18,20,23,24,27],typic:[1,2,6,7,10,12,14,15,16,18,20,21,23,27],ua:10,ua_:10,ua_devic:10,ua_df:10,ua_famili:10,ua_major:10,ua_minor:10,ua_o:10,ua_pars:10,ua_patch:10,ua_str:10,ubuntu:7,ug:17,uk:14,ukchina:15,ukrainian:[17,24],ultra:15,unalign:20,und:10,under:[4,7,8,10,13,21,24],underscor:15,understand:[8,9,13,14,15,18,20,27],understood:8,unexpect:16,unicod:[5,11],unifi:24,uniqu:[23,24],unique_currency_symbol:6,unique_emoji:5,unique_exclamation_mark:6,unique_hashtag:6,unique_ment:6,unique_numb:6,unique_question_mark:6,unique_url:6,unique_word:6,unit:[14,15,18,23],unknown:[10,12],unless:[13,21],unlik:20,unlock:16,unnest:18,unpack:15,unread:23,unsign:[14,23],unspecifi:14,until:[18,21],unusu:20,up:[2,7,8,9,14,16,18,20,21,24,27],upcom:[14,23,27],updat:[4,15,24],upload:[9,14,15,18,23],upon:21,urdu:[15,17,24],uri:[7,16],url:[0,2,4,6,7,8,10,11,13,14,15,18,21,23,24,25,26,27],url_:27,url_build:16,url_count:6,url_df:15,url_freq:6,url_list:[4,7,10,16],url_path:13,url_redirected_to:24,url_summari:6,url_to_df:[10,15,20,24,27],url_utm_ga:[19,24],urls_flat:6,urls_per_post:6,urls_to_test:13,urlth:14,urlyt:10,us:[0,1,4,5,6,7,9,10,11,12,13,14,15,16,17,18,20,21,23,24,25,26,27],usa:14,usag:[5,6,16,18,27],usd:6,usemap:[16,24],user:[0,3,6,9,10,12,14,16,18,23,24,25,26,27],user_:18,user_ag:[4,7,10,13,16],user_agent_pars:10,user_id:18,user_ment:18,user_timelin:18,userag:13,usernam:23,usual:[4,8,12,18,20,21],usuali:10,utc:15,utf:[7,18],util:[2,18],utm:[19,24],utm_campaign:19,utm_cont:19,utm_medium:19,utm_sourc:19,utm_term:19,v11:11,v13:[5,24],v1642801328:15,v1644335726:15,v1644381627:15,v1644418652:15,v1644595412:15,v1:8,v271:15,v274:15,v281:15,v282:15,v285:15,v286:15,v290:15,v2_0_0m1638886228:10,vacanc:9,valid:[6,14,18,19,23],valu:[2,4,7,8,10,14,15,16,18,20,21,23,24],value_count:[10,15],valueerror:[1,24],variabl:24,varieti:18,variou:[5,6,7,15,21,24],ve:24,veget:5,vegetable_emoji:5,vegur:7,vehicl:23,verb:9,veri:[1,4,7,8,9,10,12,13,15,16,18,20,21,24,27],verifi:[12,15],versatil:24,version
:[7,10,16,24],via:[14,18,21,23],vid_id:14,video:[0,13,14,18,21,23,24,25,26,27],video_categories_list:23,video_content_loc:15,video_descript:15,video_dur:15,video_expiration_d:15,video_publication_d:15,video_thumbnail_loc:15,video_titl:15,videocapt:[14,23],videocategori:23,videocategoryid:[14,23],videocount:[14,23],videodefinit:[14,23],videodimens:[14,23],videodur:[14,23],videoembedd:[14,23],videoid:23,videolicens:[14,23],videos_list:23,videosynd:[14,23],videotyp:[14,23],vietnames:[15,17,24],view:[8,14,18,21,23],viewcount:[14,23],viewer:[14,23],viewport:[4,16,24],vine:18,violat:23,virginia:15,visual:27,vmi660635:10,volleybal:23,von:8,vp:15,vs:[0,15,25],w3c:16,w:[7,14,15],w_320:15,wa:[4,5,6,10,13,15,16,18,21,24],wai:[2,4,6,7,10,15,16,18,20,24,27],wait:[4,16],walk:15,wall:10,want:[0,1,2,3,5,6,7,8,9,10,12,13,14,15,16,18,20,21,22,23,25,27],warn:14,watch:[1,15,18],we:[2,8,9,10,13,15,16,20,21,27],web000079:16,web00007a:16,web00007c:16,web00007g:16,web00007h:16,web00007k:16,web:[7,8,14,15,16,17],webpag:[14,23],websit:[0,3,8,10,13,14,15,16,23,24,25,27],website_name_crawl_1:4,website_name_crawl_2:4,wed:16,week:[14,15,18,27],weight:[0,24,25,26,27],well:[6,7,9,10,12,13,14,15,16,18,20,21,22,23,24,27],went:10,were:[10,14,15,18,21,23,24],weren:10,west:15,what:[2,4,5,6,7,8,9,10,12,13,15,16,18,20,21,27],whatev:[21,27],when:[1,4,6,7,8,10,13,14,15,16,18,21,23,24,27],whenc:21,whenev:21,where:[2,4,6,7,10,14,15,16,18,20,21,24,27],wherea:21,whereaft:21,wherebi:21,wherein:21,whereupon:21,wherev:21,whether:[1,2,4,6,8,9,10,13,14,15,16,18,20,21,23,24],which:[2,4,6,7,8,10,13,14,15,16,17,18,20,21,22,23,24,27],whichev:[16,20,24],white:[14,22],whitespac:[2,21,22,24],whither:21,who:[4,6,13,14,15,18,21,23],whoever:21,whole:[5,7,16,21],whom:[18,21],whose:[14,21],why:[4,10,13,21],width:[16,23,24],wilson:15,win64:10,win:[15,21],window:[10,16],wire:15,wired_autocomplet:15,wired_first:15,wired_reinv:15,wired_seth:15,wired_video:15,wired_wir:15,within:[1,2,9,14,16,18,21,22,23],without:[4,7,14,16,21,23,24
,27],woeid:18,won:[4,27],word:[0,1,2,5,6,8,9,10,14,15,18,24,25,26,27],word_count:6,word_freq:6,word_frequ:[21,22,24,27],word_summari:6,word_token:[22,24],words_flat:6,words_per_post:6,words_to_extract:6,words_to_find:6,work:[4,6,8,9,10,13,16,18,21,23,27],worker:[12,15],world:15,worldnew:15,worri:[4,13],worth:5,would:[2,4,6,10,13,14,15,16,18,20,21,23],wrangl:27,wrap:24,wrestl:23,write:2,written:[6,13,14,15],wrong:[10,13],wtd_freq:[21,24],wtd_freq_perc:21,wtd_freq_perc_cum:21,www:[5,6,7,10,13,15],x11:10,x64:10,x86_64:10,x:[8,9,10,14,15,16,27],xhtml:[7,16],xlarg:14,xm:16,xml:[0,7,13,20,24,25,26,27],xpath:[0,3,24,25,26,27],xpath_selector:[16,24],xxlarg:14,y:[10,14],yahoo:18,yandex:13,yandexbot:10,ye:[7,8],yea:8,year:[14,15,18],yellow:[5,14],yet:[9,16,20,21],yeti:13,york:15,you:[1,2,4,5,6,7,8,9,10,12,13,14,15,16,17,18,20,21,22,23,25,27],your:[2,4,5,6,7,8,9,10,12,13,14,16,18,19,20,21,23,25],your_app_kei:18,your_app_secret:18,your_cx:14,your_google_developer_kei:8,your_kei:14,your_oauth_token:18,your_oauth_token_secret:18,your_user_ag:4,yourself:[16,21],yourselv:21,yout:20,youtub:[0,8,21,24,25,26,27],youtube_channel_detail:14,youtube_video_detail:14,youuuuuu:6,youuuuuuu:6,yymmdd_article_titl:15,yyyi:[15,18,23],z:10,zero:[8,14,16,23],zgrab:10,zh:[14,23],ziggozakelijk:10,zip:[10,24],zs:15},titles:["advertools package","Create Ads on a Large Scale","Create Ads Using Long Descriptive Text (top-down approach)","advertools.code_recipes package","\ud83d\udd77 SEO Crawling & Scraping: Strategies & Recipes","Emoji: Extract, Analyze, and Get Insights","Extract structured entities from text lists","\ud83d\udd77 Python Status Code Checker with Response Headers","Import and Analyze Knowledge Graph Results on a Large Scale","Generate Keywords for SEM Campaigns","Log File Analysis","Regular Expressions for Extracting Structured Entities","Reverse DNS Lookup in Bulk","\ud83e\udd16 Analyze and Test robots.txt Files on a Large Scale","Import Search Engine Results Pages (SERPs) for Google 
and YouTube","Download, Parse, and Analyze XML Sitemaps","\ud83d\udd77 Python SEO Crawler / Spider","Stopwords in Several Languages","Twitter Data API","URL Builders","Split, Parse, and Analyze URL Structure","Text Analysis","Tokenize Words (N-grams)","YouTube Data API","advertools","advertools","advertools","advertools: productivity & analysis tools to scale your online marketing"],titleterms:{"0":24,"01":24,"02":24,"03":24,"04":24,"05":24,"06":24,"07":24,"08":24,"09":24,"1":24,"10":24,"11":24,"12":24,"13":24,"14":24,"17":24,"18":24,"19":24,"2":24,"2018":24,"2019":24,"2020":24,"2021":24,"2022":24,"21":24,"23":24,"25":24,"26":24,"27":24,"29":24,"3":24,"30":24,"31":24,"4":24,"5":24,"6":24,"7":24,"8":24,"9":24,"do":4,"function":[6,10,16,18],"import":[8,14],"long":2,"new":[15,16],"while":[4,16],On:16,The:20,absolut:21,account:8,ad:[1,2],addit:16,advertool:[0,3,24,25,26,27],agent:[4,13],analysi:[10,21,25,27],analyt:16,analyz:[5,8,10,13,15,20],api:[8,18,23],approach:[2,13,16],articl:[2,16],audit:4,authent:18,automat:4,base:4,behavior:16,builder:19,bulk:[12,13],campaign:[9,27],can:4,certain:4,chang:[24,25],checker:7,code:7,code_recip:3,concurr:4,condit:4,consol:16,content:[0,3,25,27],control:4,convent:27,copi:4,count:21,crawl:[4,10,16],crawler:16,creat:[1,2],css:16,custom:[4,16],data:[10,16,18,23],datafram:10,depth:4,descript:2,determin:16,di:4,directori:20,discoveri:16,dn:12,domain:4,don:4,down:[2,4],download:15,element:16,emoji:5,engin:14,entiti:[6,11],express:[4,11],extract:[4,5,6,11,16],facebook:2,feed:2,file:[10,13],follow:[4,16],format:10,frequenc:21,from:[4,5,6],gener:9,get:5,googl:[2,8,14,16],gram:22,graph:8,hard:4,header:7,hit:4,how:[4,8,10],i:4,includ:4,index:[15,25],indic:25,insight:5,instal:27,instant:2,its:4,job:4,keyword:9,knowledg:8,languag:17,larg:[1,8,13],later:4,link:[4,16],list:[4,6,16],log:[4,10,24,25],logs_to_df:10,lookup:12,make:4,market:[25,27],media:[25,27],mode:[4,16],modul:[0,3],multipl:4,my:4,n:22,number:4,obei:4,onli:4,onlin:[25,27],packag:[0,3
],page:[4,14,16],paramet:[16,20],pars:[10,15,20],path:20,pattern:16,paus:4,pre:16,prepar:10,product:[25,27],python:[7,16],queri:[16,20],recip:4,regex:16,regular:[11,15],request:4,respons:7,result:[8,14],resum:4,revers:12,robot:[4,13],rule:4,run:10,s:8,same:4,save:4,scale:[1,8,13,27],scrape:4,search:[5,14,16],selector:16,sem:[9,25,27],seo:[4,16,25,27],serp:[14,16],server:4,set:[4,16],setup:8,sever:17,sitemap:15,slow:4,so:4,social:[25,27],specifi:4,spider:16,split:20,statu:7,stop:4,stopword:17,strategi:4,structur:[6,11,20],sub:4,submodul:[0,3],subpackag:0,support:10,sure:4,t:4,tabl:25,test:13,tester:13,text:[2,5,6,21,25,27],them:4,those:4,token:22,too:4,tool:[25,27],top:2,twice:4,twitter:18,txt:[4,13],url:[16,19,20],us:[2,8],user:[4,13],video:15,vs:21,want:4,websit:4,weight:21,word:[21,22],xml:15,xpath:[4,16],your:27,youtub:[14,23]}}) \ No newline at end of file +Search.setIndex({docnames:["advertools","advertools.ad_create","advertools.ad_from_string","advertools.code_recipes","advertools.code_recipes.spider_strategies","advertools.emoji","advertools.extract","advertools.header_spider","advertools.knowledge_graph","advertools.kw_generate","advertools.logs","advertools.regex","advertools.reverse_dns_lookup","advertools.robotstxt","advertools.serp","advertools.sitemaps","advertools.spider","advertools.stopwords","advertools.twitter","advertools.url_builders","advertools.urlytics","advertools.word_frequency","advertools.word_tokenize","advertools.youtube","include_changelog","index","modules","readme"],envversion:{"sphinx.domains.c":2,"sphinx.domains.changeset":1,"sphinx.domains.citation":1,"sphinx.domains.cpp":4,"sphinx.domains.index":1,"sphinx.domains.javascript":2,"sphinx.domains.math":2,"sphinx.domains.python":3,"sphinx.domains.rst":2,"sphinx.domains.std":2,"sphinx.ext.viewcode":1,sphinx:56},filenames:["advertools.rst","advertools.ad_create.rst","advertools.ad_from_string.rst","advertools.code_recipes.rst","advertools.code_recipes.spider_strategies.rst","advertools.
emoji.rst","advertools.extract.rst","advertools.header_spider.rst","advertools.knowledge_graph.rst","advertools.kw_generate.rst","advertools.logs.rst","advertools.regex.rst","advertools.reverse_dns_lookup.rst","advertools.robotstxt.rst","advertools.serp.rst","advertools.sitemaps.rst","advertools.spider.rst","advertools.stopwords.rst","advertools.twitter.rst","advertools.url_builders.rst","advertools.urlytics.rst","advertools.word_frequency.rst","advertools.word_tokenize.rst","advertools.youtube.rst","include_changelog.rst","index.rst","modules.rst","readme.rst"],objects:{"":[[0,0,0,"-","advertools"]],"advertools.ad_create":[[1,1,1,"","ad_create"]],"advertools.ad_from_string":[[2,1,1,"","ad_from_string"]],"advertools.code_recipes":[[4,0,0,"-","spider_strategies"]],"advertools.emoji":[[5,1,1,"","emoji_search"],[5,1,1,"","extract_emoji"]],"advertools.extract":[[6,1,1,"","extract"],[6,1,1,"","extract_currency"],[6,1,1,"","extract_exclamations"],[6,1,1,"","extract_hashtags"],[6,1,1,"","extract_intense_words"],[6,1,1,"","extract_mentions"],[6,1,1,"","extract_numbers"],[6,1,1,"","extract_questions"],[6,1,1,"","extract_urls"],[6,1,1,"","extract_words"]],"advertools.header_spider":[[7,2,1,"","HeadersSpider"],[7,1,1,"","crawl_headers"]],"advertools.header_spider.HeadersSpider":[[7,3,1,"","custom_settings"],[7,4,1,"","errback"],[7,3,1,"","name"],[7,4,1,"","parse"],[7,4,1,"","start_requests"]],"advertools.knowledge_graph":[[8,1,1,"","knowledge_graph"]],"advertools.kw_generate":[[9,1,1,"","kw_broad"],[9,1,1,"","kw_exact"],[9,1,1,"","kw_generate"],[9,1,1,"","kw_modified"],[9,1,1,"","kw_neg_broad"],[9,1,1,"","kw_neg_exact"],[9,1,1,"","kw_neg_phrase"],[9,1,1,"","kw_phrase"]],"advertools.logs":[[10,1,1,"","crawllogs_to_df"],[10,1,1,"","logs_to_df"]],"advertools.reverse_dns_lookup":[[12,1,1,"","reverse_dns_lookup"]],"advertools.robotstxt":[[13,1,1,"","robotstxt_test"],[13,1,1,"","robotstxt_to_df"]],"advertools.serp":[[14,1,1,"","serp_goog"],[14,1,1,"","serp_youtube"],[14,1,1,"","set_
logging_level"],[14,1,1,"","youtube_channel_details"],[14,1,1,"","youtube_video_details"]],"advertools.sitemaps":[[15,1,1,"","sitemap_to_df"]],"advertools.spider":[[16,1,1,"","crawl"]],"advertools.twitter":[[18,1,1,"","authenticate"],[18,1,1,"","get_application_rate_limit_status"],[18,1,1,"","get_available_trends"],[18,1,1,"","get_favorites"],[18,1,1,"","get_followers_ids"],[18,1,1,"","get_followers_list"],[18,1,1,"","get_friends_ids"],[18,1,1,"","get_friends_list"],[18,1,1,"","get_home_timeline"],[18,1,1,"","get_list_members"],[18,1,1,"","get_list_memberships"],[18,1,1,"","get_list_statuses"],[18,1,1,"","get_list_subscribers"],[18,1,1,"","get_list_subscriptions"],[18,1,1,"","get_mentions_timeline"],[18,1,1,"","get_place_trends"],[18,1,1,"","get_retweeters_ids"],[18,1,1,"","get_retweets"],[18,1,1,"","get_supported_languages"],[18,1,1,"","get_user_timeline"],[18,1,1,"","lookup_status"],[18,1,1,"","lookup_user"],[18,1,1,"","make_dataframe"],[18,1,1,"","retweeted_of_me"],[18,1,1,"","search"],[18,1,1,"","search_users"],[18,1,1,"","set_auth_params"],[18,1,1,"","show_lists"],[18,1,1,"","show_owned_lists"]],"advertools.url_builders":[[19,1,1,"","url_utm_ga"]],"advertools.urlytics":[[20,1,1,"","url_to_df"]],"advertools.word_frequency":[[21,1,1,"","word_frequency"]],"advertools.word_tokenize":[[22,1,1,"","word_tokenize"]],"advertools.youtube":[[23,1,1,"","activities_list"],[23,1,1,"","captions_list"],[23,1,1,"","channel_sections_list"],[23,1,1,"","channels_list"],[23,1,1,"","comment_threads_list"],[23,1,1,"","comments_list"],[23,1,1,"","guide_categories_list"],[23,1,1,"","i18n_languages_list"],[23,1,1,"","i18n_regions_list"],[23,1,1,"","playlist_items_list"],[23,1,1,"","playlists_list"],[23,1,1,"","search"],[23,1,1,"","subscriptions_list"],[23,1,1,"","video_categories_list"],[23,1,1,"","videos_list"]],advertools:[[1,0,0,"-","ad_create"],[2,0,0,"-","ad_from_string"],[3,0,0,"-","code_recipes"],[5,0,0,"-","emoji"],[6,0,0,"-","extract"],[7,0,0,"-","header_spider"],[8,0,0,"-","kn
owledge_graph"],[9,0,0,"-","kw_generate"],[10,0,0,"-","logs"],[11,0,0,"-","regex"],[12,0,0,"-","reverse_dns_lookup"],[13,0,0,"-","robotstxt"],[14,0,0,"-","serp"],[15,0,0,"-","sitemaps"],[16,0,0,"-","spider"],[17,0,0,"-","stopwords"],[18,0,0,"-","twitter"],[19,0,0,"-","url_builders"],[20,0,0,"-","urlytics"],[21,0,0,"-","word_frequency"],[22,0,0,"-","word_tokenize"],[23,0,0,"-","youtube"]]},objnames:{"0":["py","module","Python module"],"1":["py","function","Python function"],"2":["py","class","Python class"],"3":["py","attribute","Python attribute"],"4":["py","method","Python method"]},objtypes:{"0":"py:module","1":"py:function","2":"py:class","3":"py:attribute","4":"py:method"},terms:{"0":[4,5,6,7,8,9,10,11,12,13,14,15,16,20,21,23,25],"00":[10,13,14,15,23],"000":[14,18,22],"0000":10,"000000":21,"000b":16,"0039":16,"0043":16,"004a":16,"006f":16,"00954418":10,"00987329":10,"00a1":16,"00bf":16,"00c2":16,"00ce":16,"00e6":16,"00z":[14,15,23],"01":[13,14,15,23,25],"0126707":10,"0129998":10,"0133289":10,"0185":6,"0185947":10,"018jz":23,"018w8":23,"019582":10,"019_rr":23,"01a2":16,"01cgz":23,"01h6rj":23,"01h7lh":23,"01k8wb":23,"01lyv":23,"01sjng":23,"01t00":[14,23],"02":[7,13,15,25],"0213921":10,"021bp2":23,"022dc6":23,"024":[15,24],"024x1":24,"0253415":10,"025zzc":23,"0270483":7,"0271282":7,"027x7n":23,"0281389":10,"028sqc":23,"029949":10,"02d86a3cea00007e9edb0cf2000000":16,"02d86a3e0e00007e9edb0d72000000":16,"02d86a3e1300007ec2a808a2000000":16,"02d86a3e140000d437b81532000000":16,"02d86a3e150000d423322742000000":16,"02d86a494f0000d437b828b2000000":16,"02d86a4a7f00007e9edb13a2000000":16,"02d86a4a7f00007ec2a811f2000000":16,"02d86a4a7f0000d423209db2000000":16,"02d86a4a7f0000d423323b42000000":16,"02hygl":23,"02jjt":23,"02lkt":23,"02mscn":23,"02ntfj":23,"02vx4":23,"02vxn":23,"02wbm":23,"03":[13,15,25],"0315945":10,"032tl":23,"037hz":23,"03_d0":23,"03c3":16,"03glg":23,"03hf_rm":23,"03t17":15,"03tmr":23,"04":[7,15,25],"0403l3g":23,"0410tth":23,"041xxh":23,"0477209":10,"04q1x3q":23
,"04rlf":23,"05":[15,16,25],"05qjc":23,"05qt0":23,"05rwpb":23,"06":[15,25],"06442":7,"064t9":23,"066667":21,"066wd":23,"068hy":23,"06bvp":23,"06by7":23,"06cqb":23,"06j6l":23,"06ntj":23,"07":[13,15,25],"0701004":10,"0710e93d610dd8c3":7,"0774069":15,"07_53":23,"07bs0":23,"07bxq":23,"07c1v":23,"07yv9":23,"08":[13,15,25],"08427":[14,23],"087985":13,"08t17":15,"09":[13,15,16,25],"090302_gazaconferenciaml":15,"090409_machienhuu_revisit":15,"090421_mqm_speaks_rza":15,"090524_paquistaoupdateg":15,"090618_tomtest":15,"090620_as_iraq_explosion_tc2":15,"090620_iraq_blast_tc2":15,"090622_me_egypt_us_tc2":15,"090622_me_worldbank_tc2":15,"090623_egitomilitaresfn":15,"090623_iz_cairo_russia_tc2":15,"090623_mz_leaders_lifespan_tc2":15,"090624_me_inpictures_brazil_tc2":15,"090624_mz_wimbledon_tc2":15,"090625_sf_tamim_verdict_tc2":15,"090628_rn_pakistani_soldiries_ambush":15,"090629_om_pakistan_report_tc2":15,"090715_hillary_iran_cq":15,"090723_ae_silwan_tc2":15,"090729_iraquerefenbritsfn":15,"090830_ugc_ddh_sand":15,"090831_dalailamataiwan":15,"090901_japecontask":15,"090901_putin_regret_pact":15,"090901_tiananmen_movi":15,"098wr":23,"09kqc":23,"09s1f":23,"09t13":15,"09t15":15,"09xp_":23,"0b1vjn":23,"0bzvm2":23,"0c79465a9793low":15,"0cff645fbb74c21791568b78a888967d":15,"0d790f23c36dlow":15,"0f2f9":23,"0g293":23,"0ggq0m":23,"0glt670":23,"0gywn":23,"0jm_":23,"0kt51":23,"1":[1,4,5,6,7,8,9,10,12,13,14,15,16,17,18,20,21,22,23,25],"10":[2,5,6,7,10,13,14,15,16,18,20,21,25],"100":[4,10,14,16,18,21],"1000":[14,23],"10000ft":[14,23],"101":10,"101e":16,"103":10,"104":[6,16],"105":10,"108":13,"1080p":[14,23],"1083":7,"109":10,"1090":10,"1095":10,"10968":15,"10t17":15,"11":[5,6,7,10,13,14,15,16,25],"110":10,"111111":21,"113":10,"1132":6,"1149":6,"1160":6,"117821":10,"118":10,"118614":7,"119":10,"11e1":15,"11t17":15,"12":[6,10,13,15,16,18,25],"1204":15,"1210":10,"122":[14,23],"123":6,"1234567890\u0660\u0661\u0662\u0663\u0664\u0665\u0666\u0667\u0668\u0669\u32ba\ud804\udc5b\ud800\udd0d\ud802\udcaa\
u24f2\ud804\udc63\ud800\udd28\ud802\udd1b":[0,24,25,26],"124":27,"125":[2,12],"126":6,"1261":10,"1274":15,"1285":15,"129":10,"1293":15,"13":[2,5,6,7,8,10,13,15,25],"130":[2,10,12,15],"1306":8,"131k":27,"132":10,"13251":8,"13270":7,"133333":21,"1346":6,"135":10,"1350":15,"137":10,"13c3":16,"14":[6,8,10,13,15,25],"140":18,"14022":15,"1415":10,"143":10,"1435":8,"146":[10,13],"147":13,"148":13,"149":13,"149416":10,"14c904a172315a4922f4d28948b916c2":7,"15":[2,6,8,10,15,20,23],"150":13,"1500m":[14,23],"1506":15,"1509":8,"152":10,"1534":15,"154":10,"154258":10,"1545":10,"1555":15,"157":6,"1585538956622":15,"1585539039190":15,"1585539054298":15,"1585539172701":15,"1585539206866":15,"1585539237156":15,"1585539358901":15,"1585539536519":15,"159":6,"1595":6,"16":[4,6,10,13,15],"1605":6,"163":10,"164":10,"1647":16,"165":6,"1657":15,"1664":10,"1677":15,"17":[7,10,13,15,16,25],"170":[7,16],"171":10,"1727":6,"173":10,"174":10,"176":10,"177":10,"1777":10,"179":10,"179365":10,"18":[7,10,15,25],"180":[7,16],"182":10,"184":15,"185":[10,12],"1858":10,"189":6,"18c3":16,"19":[7,13,16,25],"191":8,"19142":8,"192":10,"1937":10,"194":[10,12],"1959":15,"196":10,"1970":[14,23],"1d9b91664204low":15,"1f1ee":5,"1f1f8":5,"1f32d":5,"1f33d":5,"1f340":5,"1f346":5,"1f3e9":5,"1f3fb":5,"1f3fc":5,"1f3fd":5,"1f3fe":5,"1f3ff":5,"1f415":5,"1f436":5,"1f48c":5,"1f499":5,"1f4d8":5,"1f535":5,"1f537":5,"1f539":5,"1f7e6":5,"1f91f":5,"1f94a":5,"1f951":5,"1f954":5,"1f955":5,"1f9ae":5,"1f9ba":5,"1f9e4":5,"1fad0":5,"1mb":15,"1winner":15,"2":[4,5,6,7,8,9,10,12,13,14,15,16,18,20,21,22,23,25],"20":[1,6,8,10,13,14,15,16,18,21,23,24],"200":[7,10,16,18,21],"2000":6,"200000":21,"200689":13,"2008":15,"2009":[15,16],"200d":5,"2010":15,"2011":15,"2012":15,"2013":15,"2014":[10,15],"2015":[15,17,18],"2016":[15,17],"2017":[15,23],"2018":[15,25],"2019":[15,25],"201e":16,"202":16,"2020":[13,15,16,25],"2021":[13,15,25],"2022":[7,10,13,15,25],"203":[8,10],"203191":8,"2074":10,"207504":10,"209":10,"20pct_off":19,"21":[6,10,13,14,15,16
,18,19,25],"210":6,"2103":15,"211":[10,12],"2132":10,"214":10,"217":10,"2190":10,"22":[10,13,15],"222222":21,"223":10,"2240":10,"225":10,"226":10,"2287":15,"23":[10,13,15,16,25],"232845":10,"234":10,"237":10,"24":[13,15],"241":10,"243":[10,12],"244":10,"249":[10,12],"24c3":16,"25":[2,6,12,15,16,19,25],"250":21,"252":8,"254237":10,"2547":10,"257":6,"26":[1,6,7,10,16,19,25],"266667":21,"26837":7,"27":[7,13,15,23,25],"270":2,"273819":10,"2769":15,"279":6,"27t17":15,"28":[1,13],"2815":6,"283":13,"284":13,"285":13,"286":13,"287":13,"289":13,"29":[6,7,10,15,25],"290":[10,13],"291":13,"2910":15,"292":[13,15],"292414":10,"293":13,"2950":15,"2951":15,"2952":15,"2953":15,"2954":15,"2955":15,"2984":15,"2ad504a1":16,"2anam":19,"2d":[14,23],"2e3b74":16,"2e454f":16,"2e494d":16,"2e4ccb":16,"2e77d2":16,"2e93a0":16,"2ed585":16,"2ef5ef":16,"2f1d9f":16,"2f6d5c":16,"2nd":11,"3":[4,5,6,7,8,9,10,12,13,14,15,16,18,20,21,22,25],"30":[1,2,10,13,14,15,25],"300":21,"301":16,"302":[7,16],"3021":15,"305743":10,"31":[10,12,15,25],"3153":15,"31536000":[7,16],"316":8,"3166":[14,23],"318743":10,"32":[6,7,10,13,15,16],"321":[6,8],"3250":15,"33":[6,8,13],"3313":8,"331414":10,"333":6,"333333":21,"3339":[14,23],"3395":8,"34":8,"341287":10,"34be9bf74f00low":15,"34c3":16,"35":[8,10,16],"350831":10,"3561":15,"3587":8,"36":[10,13,16],"3600":16,"360375":10,"3665":6,"3682":15,"37":[6,14,15,23],"373":15,"375":12,"375724":13,"38":[10,16],"39":[10,12,13,15,16],"39687acb":15,"397":13,"398":13,"399":13,"3d":[14,23],"3f44":16,"3k":27,"4":[5,6,8,9,10,12,13,15,16,18,20,21,23,25],"40":[13,14,16],"400":[4,13,21],"401":13,"404":[10,16],"4044":10,"41":15,"41b0":15,"42":10,"4224":15,"42307":[14,23],"426":10,"4281":15,"43":15,"4312":8,"44":[10,13],"443":7,"4430":10,"444":6,"45":[10,14],"450":14,"456":6,"46":[10,15],"461037":15,"461815":13,"462":8,"466e":15,"468588":13,"4687":6,"47":10,"474456":13,"4758":10,"47603":15,"48":[10,13,15],"4883":15,"488ed635":15,"49":[6,8,10],"491":15,"49462":8,"499":10,"49994":15,"49995":15,"4
9996":15,"49997":15,"49998":15,"49999":15,"4c69":15,"4f34":15,"4f7bea3b":16,"4k":6,"5":[1,5,6,8,9,10,12,13,14,15,16,17,21,25],"50":[1,13,14,21,24],"500":[4,8,13,14,18,21,23],"5000":18,"5004":6,"501e":16,"5050":15,"5056":8,"505b":15,"5065":15,"5068":15,"5080":15,"5081":15,"5082":15,"5083":15,"5084":15,"5085":15,"51":[10,12,13],"510":15,"52":[13,15],"520":[10,15],"53":[8,10],"533":15,"536":13,"537":[10,13],"538":[13,27],"539":13,"54":[8,15],"540":13,"5403":15,"541":13,"545":15,"547":15,"55":[8,9,15],"554":15,"555":6,"556":15,"56":[9,10,12,13,15],"563":6,"565":15,"57":[9,13,15],"572":6,"5745":6,"576":8,"58":[9,10,13],"584":8,"59":9,"596daca7dbaa7e9":16,"596daca9b91fd437":16,"596daca9bcab7e9":16,"596daca9bddb7ec2":16,"596daca9bf26d423":16,"596dacbbb8afd437":16,"596dacbd980bd423":16,"596dacbd980cd423":16,"596dacbd99847ec2":16,"596dacbd9fb97e9":16,"5e":19,"5km":[14,23],"5x":10,"6":[5,6,8,10,12,13,15,21,25],"60":[10,12,13],"600000":21,"601":6,"604800":[7,16],"619bd9be1d75db41adee6b58":15,"6201430a1d75db06ae1f62e8":15,"620345a15577c23d46622256":15,"6203cd7b5577c23d19622259":15,"62067f085577c277dd9acf42":15,"625":[9,12],"626":9,"627":9,"628":9,"629":9,"630":9,"63124":15,"632":15,"635":15,"638":15,"639":[8,14,18,23],"64":[6,13],"640":15,"645":15,"6543":8,"66":[10,12,16],"6666666666666666":6,"6666666666666667":6,"666667":21,"67":[6,16],"673":6,"674":15,"68":[10,13,16],"683":15,"6853":8,"69":[10,16],"6dba2aae6b424107":7,"7":[5,6,8,10,12,13,15,18,21,25],"70":[10,16],"701e":16,"702814":13,"706":15,"716":10,"71756":8,"72":[6,10,13,23],"7200":7,"720a8581":16,"720p":[14,23],"727":15,"728x90":19,"729":10,"73":10,"733":6,"74":12,"744247":15,"745":10,"75":[4,5,6,10,12,13,16],"7549":8,"755":15,"75911c9e":16,"75mi":[14,23],"76":13,"769":15,"77":[10,13],"78":13,"789":6,"79":[10,13],"7a28ef3b":16,"7c":[14,23],"7ec3":16,"8":[4,5,6,7,8,10,12,13,15,16,18,21,25],"80":[10,12,21],"800000":21,"801e":16,"81":10,"815":15,"8192":23,"82":16,"83":10,"841":15,"841851":15,"85855c48":16,"8601":23,"86199"
:15,"862":15,"8635":6,"86400":7,"872":15,"874":15,"875":12,"8760":8,"8808":15,"882":15,"888889":21,"89":10,"9":[5,6,7,8,10,13,15,16,21,25],"90":[2,10],"9044":15,"908":10,"90b11f47f8b2ab57cb180cbd3c6f06f9":15,"91":12,"913":15,"914107":15,"91d0":15,"92":10,"933333":21,"94":10,"94f1":15,"951053":13,"96":12,"97":[6,12],"973":15,"98":10,"98b729fa":16,"99":[6,15],"995323":15,"9cbd":15,"9dfdd38a":16,"9e64":15,"\u00e0":1,"\u0294":[0,24,25,26],"\u03b5\u03af\u03c3\u03b1\u03b9":6,"\u03c0\u03ce\u03c2":6,"\u062a\u0630\u0647\u0628":6,"\u062d\u0627\u0644\u0643":6,"\u0643\u064a\u0641":6,"\u0644\u0627":6,"\u0645\u0631\u062d\u0628\u0627":6,"boolean":[8,14,16,23],"break":[6,15,18,24,27],"byte":[7,15,16,24],"c\u00f3mo":6,"case":[1,2,4,5,6,7,9,10,12,13,14,15,16,18,20,21,24,27],"char":1,"class":[7,16],"default":[2,4,6,8,9,10,14,15,16,18,21,22,23,24,27],"do":[0,2,3,6,7,9,10,12,13,14,15,16,18,20,21,23,25,27],"est\u00e1":6,"export":16,"final":[9,15,20,23,24],"float":[14,23],"function":[0,2,4,5,7,8,9,12,13,14,15,20,21,22,24,25,26,27],"haftungsbeschr\u00e4nkt":17,"import":[0,1,2,4,5,6,7,9,10,12,13,15,16,17,18,20,22,23,24,25,26,27],"int":[1,6,9,12,15,18,21],"long":[0,1,6,10,12,13,14,18,23,24,25,26,27],"new":[0,4,6,10,14,24,25,26,27],"null":18,"public":[5,7,16,18],"return":[1,2,5,6,7,8,9,10,12,13,14,15,18,19,20,21,22,23,24,27],"s\u00fcdkorea":8,"short":[2,14,21,23],"static":[10,13],"super":[7,10],"true":[1,2,4,6,7,9,10,13,14,15,16,18,20,21,23,24],"try":[10,13,14,16,21,23,27],"while":[0,3,10,14,18,20,21,23,24,25,26],A:[4,5,6,7,8,9,10,11,13,14,15,16,18,20,21,22,23,24,27],AND:14,And:[8,10],As:[1,4,12,13,15,20,21,22,23,27],At:[14,23],Being:7,But:[4,16,21],By:[10,14,16,21,23],For:[1,4,7,8,10,13,14,15,16,18,21,23],IS:[1,2],If:[2,4,6,7,8,10,14,15,16,18,20,21,23,24,25],In:[1,2,6,8,10,12,13,14,15,16,18,20,21,23,24,27],Is:[1,6,8,15],It:[4,6,7,8,9,10,12,14,15,16,18,20,21,23],NOT:[6,14,23],No:[6,14],Not:[5,18],ON:18,OR:[14,18,23,25,27],On:[0,2,18,24,25,26],One:[1,7,13,15,16,21],Or:[9,16,20],THE:19,That:[2,
4,6,16,23],The:[0,2,4,5,6,7,8,9,10,12,13,14,15,16,18,21,22,23,24,25,26,27],Then:[16,18],There:[4,6,7,10,14,15,16,18,20,24,27],These:[4,10,16,21],To:[2,9,13,16,21,23,25],With:[7,15,18,21],_:15,__cfduid:16,__init__:24,_dash:10,_dict_product:24,_escaped_fragment_:13,_static:16,_to_df:27,a320:15,a850165d925db701988daf7ead7492d3:13,abbrevi:6,abil:[16,23,24],abl:[7,8,13,14],about:[2,4,5,6,7,10,12,13,14,15,16,18,20,21,23,24,25,27],abov:[4,8,16,18,20,21,24],abs_freq:[21,24],abs_perc:21,abs_perc_cum:21,abs_wtd_df:21,absolut:[0,12,13,20,24,25,26,27],accept:[7,14,16,23,24],access:[10,13,14,17,18,23,27],access_log:10,access_token:18,accid:4,accomplish:[21,27],accord:[13,22],account:[0,9,13,14,18,21,23,24,25,26],achiev:[4,22,27],across:[4,5,8,14,15,20,21,27],act:[14,23],action:[23,24],activ:[5,6,8,14,15,23],activities_list:23,actress:8,actriz:8,actual:[8,12,15,16,20,21,23],ad:[0,6,9,16,18,19,23,24,25,26,27],ad_:[16,27],ad_creat:[1,9,16,24,27],ad_from_str:[2,9,16,24,27],add:[4,7,10,16,21],add_prefix:10,addit:[0,2,6,10,12,14,18,21,23,24,25,26,27],addition:[16,18],addr:[10,12],address:[10,12,16,24,27],addressse:14,adgroup:9,administrativearea:8,adress:[10,12],adv:[1,2,4,5,6,7,9,10,12,13,15,16,17,18,20,21],adv_error:10,adv_log:10,adv_logs_fin:10,advantag:10,adventur:23,adver:[7,10,16],advertoo:16,advertool:[1,2,4,5,6,7,9,10,12,13,15,16,17,18,20],aerialmagzc:6,afaa7cb5e636low:15,affect:16,afghan:15,afghanistan:15,afraid:6,after:[2,4,6,14,15,16,18,20,21,22,23,27],afterward:21,ag:[7,16],again:[4,10,15,16,21],against:[8,18,21],agent:[0,3,7,10,12,16,24,25,26,27],aggreg:8,ahrefsbot:10,ai:15,aid:5,ajax:13,alert:7,algarv:1,algorithm:27,alias:8,aliaslist:[10,12],align:20,all:[2,4,5,6,7,8,9,10,13,14,15,16,18,20,21,23,24,27],allow:[1,2,7,10,13,14,16,18,23,24,27],allowed_domain:[4,16],allthreadsrelatedtochannelid:23,almost:[10,21],alon:21,along:[6,18,21],alpha:[14,23],alphabet:[8,14,23],alreadi:[4,21],also:[1,2,4,6,7,8,9,10,12,13,14,15,16,17,18,20,21,22,23,24,27],alt:[16,18,24],alt_href:[4,16],
alt_hreflang:[4,16],altern:[4,13,16,24],although:[2,16,21],altogeth:10,alwai:[2,18,21],am:[5,21],amazon:[13,15,18],america:23,america_latina:15,american:23,among:21,amongst:21,amount:[16,21],amp:15,amplifi:18,amz:7,an:[1,2,4,5,6,7,8,9,10,12,13,14,15,16,18,21,22,23,24,25,27],analysi:[0,6,7,12,15,16,18,24,26],analyt:[0,20,21,24,25],analyz:[0,7,14,16,17,18,21,24,25,26,27],anchor:[4,16],anderson:15,android:[10,15],ani:[2,4,5,6,8,9,10,13,14,15,16,18,20,21,22,23,24,27],anim:[5,6],ann:6,annot:11,anonym:10,anoth:[2,7,9,10,15,20,21,22],anotherexampl:16,anotherexmapl:16,answer:15,anyhow:21,anymor:24,anyon:21,anyth:[4,18,21,24],anywai:[9,21],anywher:[18,21],apache_error:10,api:[0,6,14,24,25,26,27],api_vers:18,app:[13,14,18,23],app_kei:18,app_secret:18,appear:[14,15,16,18,21,24],append:[2,13,14,16],appl:[13,21],applebot:13,applewebkit:10,appli:[13,14,15,16],applic:[7,8,10,14,16,18,23],appliedprivaci:10,approach:[0,9,20,21,24,25,26,27],appropri:23,ar:[2,4,6,7,8,9,10,13,14,15,16,18,20,21,22,23,24,25,27],arab:[6,14,15,17,24],arbitrari:[6,18,24],archiv:15,area:[6,14,23,27],aren:9,arg:7,argument:[4,8,14,16,24],armenian:6,around:[5,6,21],arpa:[10,12],art:23,articl:[0,15,20,24,25,26,27],articlebodi:8,articlelarg:15,artilc:20,asia:23,ask:[6,14,18,24],associ:[14,21,23],assum:[14,16,18,24],assur:7,astronaut:18,attach:[14,18,23],attack:15,attempt:16,attent:12,attitud:18,attr:16,attract:23,attribut:[4,14,16,18,21,24],au:14,audit:[0,3,13,15,16,25],auditdetail:23,australia:14,auth_endpoint:18,auth_param:18,authent:[0,12,14,23,24,25,26],author:[14,16,18,20,23],author_url:16,autocomplet:[15,27],autom:[4,7,13,27],automat:[0,3,14,23,25,27],avail:[2,4,7,8,10,11,14,15,16,17,18,20,21,23,24,27],avocado:5,avoid:20,aw:15,await:23,axi:10,azerbaijani:[17,24],b023:15,b0aef497:16,b935:15,b:[6,7,10],bY:2,back:[10,18,21,27],backend:[7,16],bad:24,bag:21,baiduspid:[10,13],ban:4,banana:21,bandwidth:7,banner:19,barcelona:9,base:[0,2,3,5,7,11,14,16,18,21,23,24,25,27],basebal:23,basi:7,basic:[4,7,9,12,15,20,27],b
asketbal:[5,23],batteri:4,bbc:[13,15],bbc_sitemap:15,beacon:7,bearer:18,beat:21,beauti:23,becam:21,becaus:[8,10,12,13,16,18,20,21],becom:[2,10,16,20,21],been:[4,15,18,21,23],beer:18,befor:[4,6,14,16,18,21,23],beforehand:21,begin:[18,22,24],behalf:[14,23],behavior:[0,7,15,23,24,25,26,27],behaviour:16,behind:21,being:[14,15,16,18,20,21,23,24,27],belong:[8,12,15,18],below:[8,14,16,21,22,23],ben:15,benefit:[2,20,27],bengali:[17,24],benton:15,besid:21,best:[14,18,21],better:[4,15,16,18,20,24,27],between:[4,9,10,14,15,16,21,22,23,27],beyond:21,bid:19,big:[4,9,10],bill:[8,14],bing:8,bingbot:[10,13],bitcoin:6,black:[14,16,21],blob:16,block:[4,10,13,15,16],blockblob:16,blocked_url:10,blog:20,bloomberg:27,blowjob:6,blown:21,blue:[5,6,14,20,21,23],blueberri:5,bmw:[1,9],boat:[14,23],bodi:[5,6,7,16,18,27],body_text:[16,24],book:[5,21],bool:[1,2,6,9,15,16,18,20,21],boost:14,boss:6,bot:[10,12],both:[6,9,14,16,18,21,22,23,27],bottom:[9,21,27],bounc:[16,21],box:[5,13,15,23],brace:1,bradford:6,brand:[6,8,10,15],brandingset:23,broad:9,broadcast:[14,23],broken:18,brown:14,browser:8,bud:16,bug:[15,24],bui:[9,13],build:[5,7,10,27],builder:[0,24,25,26],built:27,bulgarian:14,bulk:[0,24,25,26],bunch:16,buscador:8,busi:[15,23],butt:15,c01e:16,c2coff:14,c:[4,7,17],c_fill:15,ca:[14,21],cach:[7,16],call:[1,14,15,16,18,20,21,24,27],camp:16,campaign:[0,1,19,24,25,26],campaign_nam:9,can:[0,2,3,5,6,7,8,9,10,12,13,14,15,16,17,18,20,21,22,23,24,25,27],can_fetch:13,cannot:[18,21],canon:[4,7,16,24],canonical_par:4,cantant:8,capit:[1,2,8,9],capitalize_adgroup:[9,24],captial:2,caption:[14,23,24],captions_list:23,captur:[15,27],car:1,caramel:6,card:[16,18,24],card_uri:18,care:13,career:[9,13],carrot:5,casual:23,cat:5,catalan:[14,17,24],categor:[10,20],categori:[1,14,15,20,23],categoryid:23,cater:10,caus:[18,24],cc_attribut:14,cc_noncommerci:14,cc_nonderiv:14,cc_publicdomain:14,cc_sharealik:14,cdn:7,celebr:15,center:[14,23],certain:[0,3,6,7,8,10,12,13,15,16,17,20,21,24,25],certainli:10,certif:9,cgi:7,chain
:16,chanc:8,chang:[2,4,10,13,14,16,21,27],changefreq:15,channel:[14,23,24,27],channel_id:14,channel_sections_list:23,channelid:[14,23],channelplaylistvideo:23,channels_list:23,channelsect:23,channeltyp:[14,23],charact:[2,6,14,18,21,22,23,24],characterisit:10,charset:[4,7,16,24],chart:23,chat:6,cheap:9,cheat:24,check:[4,6,7,8,9,10,12,13,14,15,16,21,27],checker:[0,24,25,26],child:23,china:15,chines:[14,17,23,24],choic:5,choke:6,chokkattu:15,choos:[14,16,23],chose:10,chosen:10,christian:23,christma:15,chrome:[8,10],chronolog:[14,23],cinta:1,circl:5,circular:[14,23],citi:[1,8],ckaiserjr:6,claim:12,clarif:24,classic:23,classifi:23,clean:27,clear:[8,9,18],clearli:[9,20],click:27,client:10,client_arg:18,cline:15,clipart:14,close:4,closedcapt:[14,23],closespider_errorcount:[4,16],closespider_itemcount:[4,16],closespider_pagecount:[4,16],closespider_timeout:[4,16],cloth:5,cloudflar:[7,16],cloudfront:15,clover:5,club:[9,27],clue:13,cm:[14,23],cn:14,co:6,code:[0,4,5,6,8,10,14,15,16,18,19,23,24,25,26,27],code_recip:[0,24,25,26],codepoint:5,coffe:6,cohort:7,collect:[11,13,14,18,23,24],collin:15,collinss:15,colliss:20,color:[14,16,20,21],column:[4,6,7,8,9,10,13,14,15,16,18,20,21,24],com:[4,5,6,7,8,10,12,13,14,15,16,18,19,20,23],comand:12,combin:[8,9,10,11,13,14,16],come:[2,9,10,21],comma:[14,18,21,22,23],command:[4,10,12,13,25],comment:[13,16,23,24,27],comment_threads_list:23,comments_list:23,commentthread:23,commerc:[9,21],common:[7,10,14,23],common_with_vhost:10,commun:[4,20,27],compani:[6,8,13],compar:[15,20],comparison:[8,12],compat:[10,18],compil:11,complet:[6,9,14,18,20,21,23],complex:[10,18],complic:18,compon:[7,10,18,20,24],comprehens:27,compress:[10,24],comput:[4,10,16],concat:[10,16],concaten:15,concurr:[0,3,14,23,24,25],concurrent_item:4,concurrent_request:4,concurrent_requests_per_domain:[4,16],concurrent_requests_per_ip:4,condit:[0,3,10,16,25],conduct:13,confid:16,configur:[16,23],conform:10,conformig:10,conglomer:8,congression:15,conjunct:[14,18,23],connect:[4,13,18
,24,27],consecut:[4,16],consid:[6,18,23],consider:[2,21,27],consist:[2,4,9,10,18,20,21,24],consol:[0,14,20,23,25],constrain:[14,23],consum:[7,18],consumed_onli:18,contaboserv:10,contain:[4,5,6,7,8,9,10,13,14,15,16,18,20,21,22,23,24,27],content:[4,7,8,13,14,15,16,17,20,21,23,24,26],contentdetail:23,contentownerdetail:23,contenturl:8,context:[6,8,11],continu:[7,27],contrast:6,contributornameid:16,control:[0,3,7,14,16,24,25,27],conveni:27,convert:[2,10,16,20,24,27],cookbook:11,cool:27,coordin:[14,23],copi:[0,3,25,27],copyright:[16,17],core:10,corn:5,coronaviru:15,corpor:8,corpu:21,correct:[6,8,24],correctli:2,correspond:15,cost:23,could:[6,7,14,21,23,24],count:[0,1,5,6,10,12,13,15,18,22,24,25,26,27],counti:15,countri:[5,14,16,20,23,24,27],countryau:14,countryuk:14,cours:[7,9,21],coverag:24,covid:15,cpu:10,cq:15,cr:14,crash:16,crawl:[0,3,7,12,13,20,24,25,26,27],crawl_df:[7,16],crawl_head:[7,24,27],crawl_logs_df:10,crawl_logs_to_df:10,crawl_tim:[7,16],crawler:[0,4,7,10,24,25,26,27],crawllogs_to_df:[10,24],cream:6,creat:[0,4,5,7,8,9,14,18,20,23,24,25,26,27],creation:27,creativ:[14,23],creativecommon:[14,23],credenti:[8,14,18,23],credibl:18,cricket:23,criteria:23,criterion:9,critic:[8,14],croatian:[14,17,24],crossorigin:[16,24],crowd:14,cse:24,css:[0,4,24,25,26,27],css_link:4,css_selector:[16,24],csv:[6,10],ct:[7,16],ctrl:4,cultur:15,cultura_sociedad:15,cum_count:[10,12],cum_perc:[10,12],cumul:[12,21],cup:6,curat:23,currenc:[0,21,24,25,26,27],currency_summari:6,currency_symbol:6,currency_symbol_count:6,currency_symbol_freq:6,currency_symbol_nam:6,currency_symbols_flat:6,currency_symbols_per_post:6,current:[4,10,15,16,18,23,24,27],cursor:18,custom:[0,3,7,10,14,24,25,26,27],custom_set:[4,7,10,16,24],customiz:16,cutom_set:4,cx:14,czech:14,d4889b15:15,d74930cf:15,d76b68d148ddec1efd004:16,d9646265:10,d99f2368:16,d:[6,7,10,14],d_placeholder_thescen:15,dai:[4,6,14,18,23],danish:[14,17,24],dark:5,dash:[10,24],dash_html_compon:10,dashboard:[18,27],dashboardom:7,data:[0,6,7,9,13,14,
15,20,24,25,26,27],databas:[5,6,10,11,24,27],datacamp:27,datafram:[0,5,6,9,13,14,15,16,18,20,21,24,25,26,27],dataset:[6,16,20,21,27],date:[10,13,14,15,16,18,23,24,27],daterestrict:14,datetim:[10,14,15,23,24],datetime64:15,david:15,db:24,dd:18,ddthh:23,de:[1,4,8,9,16],deal:27,death:15,debug:[10,14],debut:15,dec:15,decid:[15,16,18],decis:[7,15,27],decod:20,decrib:16,deep:16,default_request_head:16,defeat:15,defin:[8,10,14,21,23,24],definit:[14,23],deflat:[7,16],delai:13,delimit:[20,22],deliveri:27,demot:[14,23],denot:13,depend:[6,7,8,9,15],deprec:[23,24],depth:[0,3,7,16,25],depth_limit:[4,16],desc_text:2,descend:[14,23],describ:[9,21],descript:[0,4,6,8,9,16,18,20,21,23,24,25,26,27],design:[9,13],desir:[10,18],desktop:10,destin:[10,20],detail:[2,7,9,10,13,14,16,18,23,27],detaileddescript:8,detect:18,determin:[0,9,14,21,24,25,26],develop:[5,8,13,14,18,23],df:24,di:[0,3,25],diamond:5,dict:[7,10,16],dict_kei:[5,6,17],dictionari:[4,5,6,7,16,17,24],did:[6,15,21],didn:27,differ:[2,4,5,6,8,9,10,11,13,14,15,16,18,20,21,23,27],differenti:19,difficult:9,digit:[0,27],dimens:[14,23],dir_1:[15,20],dir_2:[15,20],dir_3:[15,20],dir_4:15,dir_5:15,dir_6:15,dir_7:15,direct:[7,13],directli:18,directori:[0,24,25,26],disabl:14,disabled0:14,disallow:[13,16],disambigu:18,discordbot:13,discount:9,discov:[4,10,16,20,27],discoveri:[0,24,25,26],discreet:18,discuss:6,diseas:15,disk:10,dislik:23,displai:[6,10,13,14,23],dist:18,distanc:[14,23],distinct:18,distinguish:[10,16],distort:20,district:15,divers:27,divid:[2,21],dn:[0,10,24,25,26],doc:[8,18],document:[7,8,14,16,18,21,24],documentaion:16,doe:[2,4,5,6,12,13,14,15,16,21,22,23,27],doen:10,doesn:[4,9,10,16,21],dog:5,dollar:[6,22],domain:[0,3,7,10,12,13,14,16,20,24,25],domin:14,don:[0,1,3,6,7,10,14,16,20,21,24,25,27],done:[4,7,9,10,14,15,20,21,27],dot:[21,22],dotbot:10,down:[0,3,9,10,21,24,25,26,27],downgrad:7,download:[0,4,7,13,16,20,23,24,25,26,27],download_d:[13,15,24],download_delai:[4,16],download_lat:[7,16],download_slot:[7,16],download_time
out:[7,16],download_timout:16,dp8hsntg6do36:15,dr:10,draggabl:[16,24],drink:[5,6],drive:8,drizzl:6,drop:24,drop_dupl:13,dtype:[8,10,13,15],dubai:1,due:[6,10,18,21,23],duplic:[4,12,14,16,18],durat:[14,23],dure:[14,21],dutch:[14,17,24],duti:15,dwgyu36up6iuz:15,dynam:[7,16],e01:16,e7e15811c65f406f89f89fe10aef29f5:15,e:[1,7,9,14,16,19,21,23,24],each:[1,2,5,6,8,9,10,11,12,13,14,15,16,17,18,20,21,22,23,24],ear:5,earliest:23,earth:18,easi:[7,9,15,20,24,27],easier:[4,6,9,16,18,20,24,25,27],easiest:15,easili:[2,7,10,13,15,17,18,20,27],ed:11,editor:15,educ:9,ee0djx6z511tgx88:7,effect:[10,18,20],effici:[7,10,12,16],effort:18,eggplant:5,eight:21,eighti:13,either:[6,9,10,14,15,18,21,23,24],elabor:20,elect:15,electron:23,element:[0,2,4,6,7,8,24,25,26,27],element_1:24,element_2:24,eleven:21,eli:16,eliasdabba:5,elig:8,eln:15,els:[2,8,18,21],elsewher:21,email:[8,19],emb:23,embed:[14,18,23],embedd:[14,23],embedhtml:23,emerg:4,emo:16,emoji:[0,16,21,24,25,26,27],emoji_:27,emoji_count:[5,6],emoji_df:[5,24],emoji_entri:5,emoji_flat:[5,6],emoji_flat_text:[5,6],emoji_freq:[5,6],emoji_nam:6,emoji_per_post:[5,6],emoji_raw:5,emoji_search:[5,24,27],emoji_summari:[5,6],emoji_text:[5,6],emot:[5,6],empti:[2,4,5,6,20,21,24],en:[4,7,8,15,16,18,20,23],en_u:23,enabl:[8,14],encod:[7,16,18,19,20],encount:[10,20],encourag:18,end:[2,6,7,14,16,20,22,24,27],engag:18,engin:[0,7,8,9,10,13,15,24,25,26,27],english:[14,17,20,21,24],enhanc:20,enjoi:6,enough:[2,9,14,21,23],ensur:[2,16],enter:[14,16],entertain:23,entir:[14,18],entire_words_onli:6,entiti:[0,8,13,15,18,24,25,26,27],entri:5,env:10,environ:18,episod:[14,23],equal:[10,18,20],equival:[12,16],errback:7,errno:[10,12],error:[1,4,10,12,14,16,23,24],errors_fil:10,es:[8,20],escap:[14,23],espada:1,especi:[2,4,9,13,15,21],essenti:[21,22,27],estonian:14,etag:[13,15,24],etaospid:13,etc:[4,5,6,8,9,10,11,14,15,16,17,20,21,22,24,27],eur:6,euro:6,european:27,evalu:8,even:[10,13,14,15,16,18,21,23,24],event:[10,14,15,20,23],eventtyp:[14,23],ever:[14,21],everi:[10,13,15
,16,18,21,23,27],everyon:[6,21],everyth:[8,18,21],everywher:21,exact:[4,9,18],exactli:[2,5,23],exactterm:14,exampl:[2,4,6,7,8,9,10,13,14,15,16,18,20,21,22,23,24,27],example_crawl_1:4,excalam:6,exce:[1,2],except:[4,18,20,21],excit:6,exclam:[0,22,24,25,26],exclamation_mark:6,exclamation_mark_count:6,exclamation_mark_freq:6,exclamation_mark_nam:6,exclamation_marks_flat:6,exclamation_marks_per_post:6,exclamation_summari:6,exclamation_text:6,exclud:[9,14,16,18,20,23,24,27],exclude_repli:18,exclude_url_param:[16,24],exclude_url_regex:[16,24],excludeterm:14,exclus:[14,23],exec:13,exist:[5,6,9,10,18],exit:10,exmapl:[4,7,16,20,27],expand:24,expect:[5,7,16],expens:7,experi:21,explain:[15,27],explan:16,explanatori:20,explicitli:[14,18,20],explod:15,explor:[5,6,15,16,17,18],exploratori:[4,16],explosionai:17,exposur:15,express:[0,3,5,6,9,10,13,14,16,21,24,25,26,27],ext_alt_text:18,extend:[10,18],extens:[4,10,13,14,24],extern:[7,10],extra:[2,10,21],extra_info:21,extract:[0,3,10,13,20,24,25,26,27],extract_:[6,24,27],extract_curr:[6,24],extract_emoji:[5,6,24],extract_exclam:[6,24],extract_hashtag:[6,24],extract_intense_word:[6,24],extract_ment:[6,24],extract_numb:[6,24],extract_quest:[6,24],extract_url:[6,24],extract_word:[6,24],extrem:[4,7,9,16,27],ey:13,f53301c8286f9bf59ef297f0232dcfc1:15,f:10,face:[5,14],facebook:[0,13,19,21,24,25,26],facebookbot:10,facebookexternalhit:13,failur:7,fairli:20,fall:[8,14,18,23],fallback:1,fals:[1,2,4,6,9,10,13,15,16,18,20,21,24],famili:[10,18],familiar:15,fashion:23,fast:[7,12,24],faster:[15,24],fastest:15,fatal:15,favorit:[1,6,18,21],fb_robot:13,fb_test:13,fb_userag:13,fe546b9b:15,featur:[2,14,15,18,23,24,27],feb:[7,10],februari:[15,23],feed:[0,23,24,25,26],feel:[5,6,24],fetch:[13,16,24],few:[4,6,7,10,15,16,20,21,27],fewer:2,field:[10,14,23,24],fifteen:[9,21],fifti:21,figur:[13,16,18,27],file:[0,1,4,7,12,14,15,16,24,25,26,27],filedetail:23,filepath:16,filetyp:14,fill:14,filter:[10,14,15,18,20,23,24],filter_to_owned_list:18,find:[4,5,6,14,16,18,20,
21,23,27],fine:16,finger:5,finish:4,finnish:[14,17,24],fire:6,first:[2,4,6,8,13,14,15,16,18,20,21,22,23,24],fish:[14,23],fit:[2,23,24],five:[2,13,16,20,21],fix:[10,16,24],fl_progress:15,flag:[5,6],flat:[5,6],flavor:6,flex:13,flexibl:16,flight:[14,18],fligt:14,float64:15,focu:[9,12,27],focus:14,folder:4,follow:[0,2,3,5,6,7,10,14,15,17,18,20,21,23,24,25,26,27],follow_link:[4,7,10,16,24],followers_count:6,food:[5,6,23],footbal:[5,9,15,23,27],footer:[4,16,24],footer_links_href:4,footer_links_text:[4,16],footer_links_url:16,footnot:17,forc:18,forchannelid:23,forcontentown:[14,23],fordevelop:[14,23],form:[6,8,21],format:[0,1,2,7,9,11,13,14,16,18,23,24,25,26,27],former:21,formerli:21,formin:[14,23],forth:[14,18,23],forti:[21,27],forusernam:23,forward:7,found:[4,10,14,15,18],four:[5,6,13,14,16,20,21,23],fr:[8,14,16],fraction:16,frag_1:20,frag_2:20,fragment:[15,20],frame:9,franc:14,free:14,freebas:[14,23],freixo:1,french:[14,17,24],freq:15,frequenc:[0,5,6,12,24,25,27],frequent:21,fri:7,friend:18,from:[0,3,8,10,11,12,13,14,15,16,18,20,21,22,23,24,25,26,27],front:[6,21],fruit:5,ft:[14,23],fucntion:6,full:[1,4,5,7,9,15,16,18,21,24,27],fulli:[5,6,18],func:18,funcion:8,further:[16,20,21],futur:[18,23],g:[1,7,14,16,19,23,24],g_face:15,gadget:2,gain:[15,25],galaxi:15,game:23,garda:12,gecko:10,gener:[0,6,10,13,16,19,20,21,23,24,25,26,27],genr:15,geocod:18,geograph:[14,23],geoloc:14,geometr:5,georgia:15,geotag:18,german:[14,17,24],gestur:5,get:[0,1,2,4,6,7,8,9,10,12,13,14,15,16,17,18,20,21,22,23,24,25,26,27],get_application_rate_limit_statu:18,get_available_trend:18,get_favorit:18,get_followers_id:18,get_followers_list:18,get_friends_id:18,get_friends_list:18,get_home_timelin:18,get_list_memb:18,get_list_membership:18,get_list_status:18,get_list_subscrib:18,get_list_subscript:18,get_mentions_timelin:18,get_place_trend:[18,24],get_retweet:18,get_retweeters_id:18,get_supported_languag:18,get_user_timelin:18,gideon:15,give:[4,6,7,9,12,14,16,18,20,21],given:[2,4,13,14,15,16,18,20,24],gl:
14,global:[16,18,24],glove:5,gmail:8,gmbh:17,gmt:[7,16],go:[6,7,9,10,13,14,15,16,21,24],goe:[4,15],golf:23,good:[2,4,6,10,12,15,16,20],googl:[0,10,12,13,20,23,24,25,26,27],googlebot:[10,12,13],googletagmanag:4,googtwfb:13,got:16,gp:13,gr:10,grai:14,gram:[0,24,25,26],granular:16,graph:[0,16,24,25,26],graphic:9,grayscal:14,great:[1,6,16,20,27],greater:18,greek:[6,14,17,24],green:[6,14,21],grin:5,group:[2,5,6,9,13,24,27],groupbi:13,gtm:4,gtm_noscript:4,gtm_script:4,guarante:18,guid:[5,23],guide_categories_list:[23,24],guidecategori:23,guitar:9,gunicorn:7,gwnlj8m99yumucgdd6ytm:7,gx12:2,gz:[15,24],gzip:[7,16],h1:[4,16],h2:[4,16,24],h3:[4,7,16],h4:4,h5:4,h6:[4,16],h:[6,10,24],h_180:15,ha:[2,4,6,9,13,15,16,18,20,21,23,24,27],haaatttteee:6,had:[4,5,6,21],hahahahahahaha:6,haiku:18,half:21,han:[14,23],hand:[5,8,9],handl:[4,10,12,13,14,18,24,27],handler:10,hant:[14,23],happen:[4,10,20],happi:[10,18],hard:[0,3,25],hash:20,hashtag:[0,11,13,18,21,24,25,26,27],hashtag_count:6,hashtag_freq:6,hashtag_raw:11,hashtag_summari:6,hashtags_flat:6,hashtags_per_post:6,hate:18,hauptstadt:8,have:[1,2,4,5,6,7,8,9,10,12,13,14,15,16,18,20,21,22,23,24,27],hd:[14,23],he:[6,15,21],head:[5,6,7,9,10,13,15,16,24,25,27],header:[0,4,13,15,16,24,25,26,27],header_links_href:4,header_links_text:[4,16],header_links_url:16,headers_df:7,headers_spid:7,headersspid:7,headlin:27,health:[2,23],heart:5,hebrew:[14,17,24],height:[16,23,24],heldforreview:23,hello:[5,6,13,16],help:[4,6,7,10,12,14,15,16,18,20,22,24,27],helper:[5,22],henc:21,her:21,here:[2,5,6,7,9,10,14,15,16,20,21,27],hereaft:21,herebi:21,herein:21,hereupon:21,herself:21,heru80fdn:15,hfubv4v3ai:6,hi:[6,15,21],hidden:21,hierarchi:8,high:[4,8,14,15,16,23],higher:[8,14,15,23,24],highest:[14,23],highli:[14,16,23,27],highrang:14,hilari:18,him:21,himself:[15,21],hindi:[15,17,24],hip:23,hit:[0,3,7,16,25],hl:[14,23],ho4kx7zz24:6,ho:8,hobbi:23,hockei:23,hodgeman:15,hol:10,hola:6,home:[13,23],home_timelin:18,honnib:17,hood:7,hop:23,hope:[6,27],hopefulli:27,hopew
el:15,host:[10,12,14,24,27],host_df:[10,12],hostnam:[10,12,20],hot:[5,6],hotel:[1,5,14],hour:[4,18],hous:15,how:[0,2,3,5,6,7,9,13,15,16,18,20,21,24,25,26,27],howev:[10,14,18,21,23],howsearchwork:13,hp:13,hq:14,href:[4,16,24],hreflang:[4,7,24],ht:16,hte:15,htm:10,html:[4,7,10,13,15,16,18,20,23,24],http:[4,5,6,7,8,10,13,15,16,18,20],httperror_allow_al:7,huge:14,hulu:15,humor:23,hundr:[7,16,21],hungarian:[14,17,24],hurri:4,husband:6,hydrat:18,hyphen:2,i18n_languages_list:23,i18n_regions_list:23,i18nlanguag:23,i18nregion:23,i:[0,3,5,6,7,13,14,16,20,21,25,27],ia_archiv:13,ibmo9hrztai:7,ic:[6,23],iceland:14,icon:14,id:[4,7,8,14,16,18,23],idea:[4,6,9,16,21,27],ideal:[13,20,21,27],ident:18,identifi:[14,16,18,20,23],ifram:4,iframe_src:4,ignor:21,imag:[7,8,10,13,14,15,16,18,24],image_loc:15,img:[16,24],img_:16,img_alt:16,img_src:16,imgcolortyp:14,imgdominantcolor:14,imgr:13,imgsiz:14,imgtyp:14,immedi:[13,18],implement:24,importantli:[10,20,27],improv:[14,21,24],inc:8,includ:[0,3,6,9,10,13,14,15,16,18,20,22,23,24,25,27],include_card_uri:18,include_ent:18,include_ext_alt_text:18,include_rt:18,include_url_param:[16,24],include_url_regex:[16,24],include_user_ent:18,includesubdo:16,includesubdomain:7,inclus:[14,23],inconsist:20,inde:21,independ:23,indepent:16,index:[0,7,8,10,14,16,18,24,26,27],india:15,indic:[4,7,13,14,16,18,20,23,24],individu:[14,23],indonesian:[14,17,24],industri:[13,14,15,27],infer:6,influenti:18,info:[10,14,24],inform:[5,7,8,10,12,14,15,18,20,21,23,24,27],inherit:8,initi:[4,8],input:[1,2],insensit:[5,24],insert:[1,20],insid:22,insight:[0,4,15,21,24,25,26,27],instagram:18,instal:25,instanc:[6,8],instant:[0,24,25,26],instead:[6,13,16,18,20,21,23,24],instruct:[13,14,23],int64:[10,13,15],intact:2,integ:[2,14,23],integr:9,intend:[14,18,23],intens:[6,24],intent:[9,27],interact:[15,18],interest:[6,7,8,9,10,13,15,16,21,25],interfac:[7,14,18],interior:18,intern:[7,14,15,16,18],internacion:15,internation:14,internet:15,interv:[4,27],interview:15,introductori:27,invalid:
24,invert:6,inverview:15,investig:4,invideopromot:23,io:[7,16,18],iowa:15,ip:[10,12,14,16,24,27],ip_address:[10,12,16],ip_host_dict:10,ip_list:12,ipaddrlist:[10,12],ir88:15,ir:12,iran:15,iraq:15,irish:[17,24],ismap:[16,24],iso:[8,14,18,23],issu:[4,24,27],italian:[14,17,24],item:[4,9,14,16,18,20,23,24],item_a:16,item_b:16,iter:2,its:[0,1,3,5,7,8,9,10,15,16,18,20,21,23,25],itself:[10,16,20,21],iyl50:7,ja:18,janeiro:9,japanes:[14,17,24],java:10,javascript:4,jazz:23,jenni:6,ji:8,jin:8,jl:[4,7,10,13,16,24],job:[0,3,9,25,27],jobdir:4,john:6,join:[6,16],jpeg:7,jpg:15,jpy:6,js:[4,10],js_script_src:4,js_script_text:4,json:[7,10,14,16,18,24],json_norm:[10,24],jsonld_1_:16,jsonld_:16,jsonld_error:24,jsonlin:[7,16],julian:15,jung:8,jungl:8,just:[2,5,6,10,14,16,18,21,27],k:[10,16,21],ka:15,kaggl:[5,27],kang:8,kansa:15,kazakh:[17,24],keep:[1,4,5,8,9,12,13,16,18,21,24,27],kei:[4,5,6,8,14,16,17,18,20,21,23,24],key_nam:6,keyword:[0,5,8,16,17,21,24,25,26,27],keywords_df:9,kfpdr3hupi:6,khtml:10,kid:6,kill:4,kilomet:[14,18,23],kind:[7,16,24,27],kiwi:21,km:[14,18,23],know:[2,6,9,10,16,20,27],knowledg:[0,23,24,25,26],knowledge_graph:[8,24],known:[7,16,18,21,24,27],korea:8,korean:[8,14],kw_:[16,24,27],kw_broad:9,kw_df:9,kw_exact:9,kw_gener:[9,16,24,27],kw_modifi:9,kw_neg_broad:9,kw_neg_exact:9,kw_neg_phras:9,kw_phrase:9,kwarg:[6,7],l1:16,lab:15,label:9,lamborghini:1,land:[2,9,27],lang:[13,18],lang_:14,lang_ar:14,lang_bg:14,lang_c:14,lang_ca:14,lang_d:14,lang_da:14,lang_el:14,lang_en:14,lang_et:14,lang_fi:14,lang_fr:14,lang_hr:14,lang_hu:14,lang_i:14,lang_id:14,lang_it:14,lang_iw:14,lang_ja:14,lang_ko:14,lang_lt:14,lang_lv:14,lang_nl:14,lang_no:14,lang_pl:14,lang_pt:14,lang_ro:14,lang_ru:14,lang_sk:14,lang_sl:14,lang_sr:14,lang_sv:14,lang_tr:14,lang_zh:14,languag:[0,7,8,9,14,15,16,18,20,21,23,24,25,26,27],larg:[0,4,5,10,12,14,15,16,21,24,25,26,27],larger:[14,18,23],last:[1,2,6,13,15,16,20,21,24],last_dir:[15,20,24],lastmod:15,lat:18,latenc:7,later:[0,3,10,15,25],latest:[1,2,16,18],latin:23
,latitud:[14,18,23],latter:21,latterli:21,latvian:14,layout:[10,23],ld:[7,16,24],lead:14,leaf:5,learn:[9,15,16,21,23],leas:16,least:[14,21,23],leav:[2,13],left:[4,6,23],left_char:6,len:2,lenght:24,length:[1,2,7,15,18,20,21,22],less:[14,16,18,21,23],let:[1,2,6,8,9,13,14,15,16,21,23],letter:[2,5,14,23],level:[4,10,14,16,18,20,23],level_or_nam:14,li:[16,24],licens:[8,14,23],life:[6,25],lifestyl:23,light:[5,7],like:[5,6,7,8,9,10,12,14,15,16,18,21,23,24,27],likelyspam:23,lilguyisback:6,limit:[1,2,8,13,14,16,18,23,27],line:[1,7,8,10,12,13,14,16,25],lineart:14,lineup:6,link:[0,3,6,7,14,15,18,20,23,24,25,26,27],link_rel_href:4,link_rel_rel:4,link_rel_stylesheet:4,linkedin:13,linkedinbot:[10,13],links_frag:24,links_href:16,links_nofollow:[16,24],links_text:[16,24],links_url:[16,24],linksit:14,linux:[10,24],lisbon:1,list:[0,1,2,3,5,7,8,9,10,12,13,14,15,17,18,20,21,22,23,24,25,26,27],list_id:18,liter:8,lithuanian:14,littl:[20,25,27],live:[14,23],livestreamingdetail:23,ll:[6,13,18,21],load:[10,16,24],loc:15,local:[14,18,23],locat:[14,15,18,20,23,27],locationradiu:[14,23],log:[0,3,12,14,15,16,23,26,27],log_error:10,log_field:10,log_fil:[4,10,16],log_format:10,logic:14,login:[10,13],logs_df:10,logs_file_path:10,logs_to_df:[0,24,25,26],lokal:8,lol:6,lon:18,longdesc:[16,24],longer:[1,2,6,14,21,23,24],longitud:[14,18,23],look:[2,9,15,21],lookout:7,lookup:[0,10,18,24,25,26],lookup_statu:18,lookup_us:18,looooooovvvve:6,looooooveee:6,loop:[14,18,24],loos:6,lose:13,lost:[2,4],lot:[2,7,10,15,20,27],love:[5,18,21],love_emoji:5,lower:16,lowest:[14,23],lowrang:14,lr:14,luxuri:9,m:[6,10,13,14,15,23],ma:[7,16],machin:15,made:[6,12,18,21],mai:[10,13,14,16,18,21,23],mail:12,main:[2,8,13,14,15,16,18,20,21,24,27],mainli:[4,9,12,13,21,22],mainten:7,major:[10,13,15,18,27],make:[0,1,2,3,6,7,9,10,12,13,14,15,16,18,20,21,24,25,27],make_datafram:18,mammal:5,manag:[4,7,14,18,23,27],managedbym:23,mango:21,mani:[1,2,4,5,6,8,9,10,12,13,14,15,16,18,20,21,23,27],manipul:27,manner:[8,20],manual:4,map:[6,8,9,1
6,18,27],march:15,mark:[6,18,20,21,22,24],market:[0,8,9,14,16,19,24],martial:23,marvinmilton2:6,masscan:10,massiv:[10,12],master:[4,7,16],match:[5,6,8,9,10,14,16,18,23,24],match_typ:9,matter:9,matthew:17,max:[7,16],max_column:10,max_id:18,max_len:[1,9],max_work:[12,15,24],maxheight:23,maxim:18,maximum:[1,2,8,9,12,14,15,16,18,23],maxresult:[14,23],maxwidth:23,mayb:[6,9,13],mb:24,mckinlei:15,mckinleyd:15,me:[21,22],mean:[6,7,8,9,10,13,14,16,18,20,21,27],meaning:[15,21],meanwhil:21,measur:[4,14,23,24],media:[5,6,10,16,17,18,20,21],medium:[5,14,19,23],meet:[6,14,23],mega:15,megabyt:27,member:18,membership:18,memori:[10,16],mention:[0,8,11,18,20,21,24,25,26,27],mention_count:6,mention_freq:6,mention_raw:11,mention_summari:6,mentions_flat:6,mentions_per_post:6,mentions_timelin:18,merced:1,merg:[14,16,18,24],messag:[10,24],meta:[4,7,14,16,18,20],meta_desc:[4,16],metadata:[14,18,23,24],metallica:6,metatag:7,method:[7,10,14,16,18,23,25,27],method_from:10,method_to:10,metric:21,mi:[14,18,23],middl:24,middleeast:15,middlewar:10,might:[2,4,5,6,7,9,10,13,14,15,16,20,21,23,25,27],mile:18,militari:23,miller:15,million:21,min:10,min_rep:6,mind:[4,5,8,16,18,27],mine:[17,21,22,23,27],mini:7,minnesota:15,minor:[10,24],minu:16,minut:[14,15,23],miss:[2,6,15,24],missouri:15,mistak:13,mix:[18,20,23],mj12bot:10,mm:[15,18,23],mmb29p:10,mobil:10,mocha:6,mode:[0,3,6,18,24,25,26],model:[2,10,15],model_a:16,model_b:16,moder:[14,23],moderationstatu:23,modifi:[5,6,7,9,13,15,16,17,18,21],modul:[1,6,16,21,24,25,26,27],monitor:27,mono:14,month:[14,15,18],more:[2,4,5,6,7,8,9,10,13,14,15,16,18,20,21,23,24,27],moreov:21,morn:6,most:[1,2,4,6,7,9,10,14,15,16,18,21,23,27],mostli:[4,16,20,21,27],mostpopular:23,motorsport:23,move:21,movi:[14,15,18,23],mozilla:[10,16],mp4:15,mpu:19,ms:[10,16],msg:24,msnbot:13,much:[15,16,21,24],multi:[12,14],multimedia:15,multin:8,multipl:[0,3,6,8,13,14,15,16,24,25,27],multipli:21,mundo:15,music:23,must:[10,14,18,21,23],my:[0,1,3,6,16,21,25],my_output_fil:16,myrat:23,myrecen
tsubscrib:23,myself:21,mysit:19,mystuff:13,mysubscrib:23,n:[0,24,25,26],na:[20,24],name:[1,4,5,6,7,8,9,10,12,13,14,15,16,18,19,20,21,23,24,27],name_1:16,name_2:16,nan:[7,8,10,15,16,20],narrow:23,nasa:18,nat:[13,15],natali:15,nativ:18,native_video:18,natur:[5,6],nav:[4,16,24],nav_links_href:4,nav_links_text:[4,16],nav_links_url:16,naverbot:13,navig:18,ncov:15,nearli:6,nebraska:15,need:[1,2,4,6,7,8,9,10,12,13,14,16,18,21,27],neg:[6,9,18],neither:21,nepali:[17,24],nest:[18,23],net:[10,15],netloc:[15,20],network:[6,20],never:[6,21],nevertheless:21,newest:[15,23],news_keyword:15,news_publ:15,news_publication_d:15,news_titl:15,next:[6,9,16,21,23,27],next_cursor:18,nextpagetoken:[14,23,24],nexu:10,nfl:15,nginx:[7,16],nginx_error:10,nh:15,nine:21,nippli:6,nl:10,nobodi:21,node:18,nofllow:16,nofollow:[16,24],noindex:7,non:[10,14,21,22,23,24,27],none:[2,5,6,7,8,10,13,14,16,18,19,21,23],noon:21,nor:21,normal:[10,17],norwegian:[14,17,24],nose:15,note:[2,6,8,14,16,18,20,21,23,27],notebook:27,noth:[6,21],notic:[6,13],noticia:15,notset:14,noun:9,now:[1,2,6,9,10,13,15,16,18,21,24],nowher:21,np:15,ns:[4,15],nt:[10,16],num:14,num_currency_symbol:6,num_emoji:[5,6],num_exclamation_mark:6,num_hashtag:6,num_list:[21,24],num_ment:6,num_numb:6,num_post:[5,6],num_question_mark:6,num_url:6,num_word:6,number:[0,3,5,8,9,12,13,14,15,16,18,20,21,23,24,25,26,27],number_count:6,number_freq:6,number_of_emoji:5,number_of_hashtag:6,number_of_ment:6,number_of_numb:6,number_of_symbol:6,number_of_url:6,number_of_word:6,number_separ:6,number_summari:6,numbers_flat:6,numbers_per_post:6,numer:[18,23],nutch:10,nyt:15,nyt_new:15,nytim:15,nz:14,o:11,oauth_token:18,oauth_token_secret:18,oauth_vers:18,obama:15,obei:[0,3,10,25],obido:13,object:[5,6,8,10,15,16,18,23,27],obtain:[18,20,21],occur:[6,15,16,18,21,23,24],occurr:[6,21],odai:6,off:[4,14,21],offer:[9,18],offic:6,often:21,og:[4,16,24],og_cont:4,og_prop:4,ohio:15,ok:7,okai:6,older:18,oldest:18,omit:18,onbehalfofcontentown:[14,23],onbehalfofcontentownerchanne
l:23,onc:[2,4,8,9,10,14,15,16,18,20,21,23,25,27],one:[1,2,4,5,6,8,9,10,11,13,14,15,16,18,20,21,23,24,27],ones:[5,6,7,10,12,15,16,21],ongo:[14,23],onli:[0,1,3,6,7,10,11,13,14,15,16,18,19,21,23,24,25,27],onlin:[2,16],onto:21,open:[10,13,15,16,24],opengraph:[4,7],oper:[10,14,15,18,23,24],oppos:[9,20,24],opposit:6,opt:18,optim:[7,8],option:[2,4,6,7,9,10,13,14,16,17,18,20,21,22,23,24,27],orang:[14,21],order:[6,8,9,14,16,23],order_matt:9,org:[5,7,8],organ:8,origin:[4,10,14,16,20,24],orterm:14,other:[2,5,6,7,8,10,11,13,14,15,16,18,20,21,23,24,27],otherwis:[16,18,20,21],ottawa:15,ound:6,our:[2,6,10,18,21],ourselv:[10,21],out:[1,6,8,10,13,14,16,18,20,21,23,27],outpuf_fil:16,output:[7,10,16,18,24],output_fil:[4,7,10,13,16,24],outreach:27,outsid:[6,10,14,23],over:[4,7,15,16,18,21,24],overview:[2,5,6,12,15,27],overwrit:16,owen:15,own:[6,9,10,14,18,20,21,23,27],owner:[13,14,18,23],owner_id:18,owner_screen_nam:18,ownership:18,p:[16,24],packag:[16,17,24,25,26,27],page:[0,2,3,6,7,8,9,10,13,15,17,18,20,21,23,24,25,26,27],page_1:4,page_2:4,page_3:4,page_4:4,pagelet:13,pagemap:24,pagepostssectionpagelet:13,pagetoken:[14,23],pageview:[10,21],pagin:[24,27],pai:14,paid:6,pair:18,pakistan:15,pam:15,pamper:6,pand:24,panda:[5,6,7,9,10,13,15,16,18,24],panel:14,paper:5,param:27,paramet:[0,1,2,4,5,6,7,8,9,10,12,13,14,15,18,19,21,22,23,24,25,26,27],parent:[4,23],parenthes:22,parentid:23,parmet:16,parquet:[10,24],pars:[0,7,16,24,25,26,27],parser:27,part:[6,9,12,14,17,20,21,22,23,27],parti:18,partial:5,particular:[13,14,15,23],particularli:[14,16],partner:[14,23],pass:[4,8,13,14,15,16,18,27],past:[14,27],patch:10,patch_minor:10,path:[0,4,7,10,13,15,16,24,25,26],path_1:20,path_2:20,path_3:20,patienc:13,pattern:[0,6,13,15,20,21,25],paus:[0,3,25],pd:[6,7,10,13,15,16],penguinnyyyyi:6,peopl:[5,6,8,18,21,27],per:[5,6,14,15,18,21,27],perc:[10,12],percentag:[12,21,24],perform:[10,12,14,15,16,23],perhap:21,period:7,periscop:18,permiss:13,permut:9,perry_ron:6,persian:[15,17,24],person:[6,8,14],perspect:[16
,20,21],pet:23,petalbot:10,phone:6,photo:[14,18],php:13,phrase:[9,14,18,21,22,24],phrase_len:[21,22,24],physic:23,pic:18,pictur:[15,21],piec:7,pink:14,pinterest:13,pinterestbot:13,pip3:[25,27],pip:[25,27],pipe:[14,21,23],pipelin:12,place:[1,4,5,6,8,18,24],placehold:[24,27],plai:[5,8,14,15,23],plain:23,plaintext:23,plan:10,plant:5,platform:[2,21,27],playback:[14,23],player:23,playlist:[14,23,24],playlist_items_list:23,playlistid:23,playlistitem:23,playlists_list:23,pleas:[7,8,14,16,18,21,23],png:[7,15,16],podcast:15,point:[5,8,14,20,23],pointer:12,polici:7,polish:[14,17,24],polit:[4,18,23],pop:23,popul:20,popular:[10,18,23,27],port:20,porto:1,portug:1,portugues:[14,15,17,24],posicionamiento:8,posit:[6,8,14,18,23],possibl:[9,10,13,14,21,27],post:[5,6,17,18,20,21,25,27],posts2:6,potato:5,potent:13,potenti:[16,18],potteri:15,pound:6,povertydata:7,power:[6,7,16],ppc:21,ppp046177196171:10,ppp089047044105:10,practic:[4,10,12,16,27],pre:[0,10,21,24,25,26],preced:24,prefer:18,preferenti:18,prefix:[8,24],preload:7,premier:15,prepar:[0,5,15,24,25,26],prepend:[18,20],present:[14,18,24],presidenti:15,pressur:16,pretti:16,prevent:[18,24],previou:[20,23,24],previous_cursor:18,prevpagetoken:[14,23],prg:7,price:[9,16,20],print:[5,6,10,15,17,24],prioriti:15,probabl:[4,16,27],process:[4,7,10,12,15],processingdetail:23,produc:[1,10,14,15,27],product1:20,product2:16,product:[0,1,2,8,9,14,16,20,21,24],profession:23,profil:[13,18],program:18,programmat:14,prohibit:13,project:[7,8,14,16,23,27],promis:27,promo:15,promot:15,proper:[6,27],properli:[9,10,14,15,20,23,24],properti:[4,14,16,23],protocol:7,prouc:14,provid:[1,2,4,6,9,10,12,13,14,15,16,18,20,21,23,24,27],proxi:12,proxito:[7,16],publication_languag:15,publication_nam:15,publish:[15,23],publishedaft:[14,23],publishedbefor:[14,23],pump:6,punctuat:24,puppi:18,purchas:9,purpl:14,purpos:13,put:[9,10,15,16,21],puzzl:23,pypi:24,pyt:16,pyth:16,python:[0,5,17,18,24,25,26,27],python_tweet:18,q:[7,14,18,23],q_80:15,qualifi:5,qualiti:[7,14],quan
tifi:21,queri:[0,8,10,13,14,15,18,23,24,25,26,27],query_:20,query_color:20,query_pric:20,query_s:20,query_tim:[8,24],querytim:[14,24],question:[0,2,15,18,21,22,24,25,26,27],question_mark:6,question_mark_count:6,question_mark_freq:6,question_mark_nam:6,question_marks_flat:6,question_marks_per_post:6,question_summari:6,question_text:6,questionnair:14,quick:[2,13,15],quickli:4,quit:[13,15,21],quot:22,quota:23,quotat:21,r3ynjjjcug:6,ra:15,race:[15,23],radio:15,radiu:18,rai:[7,16],rain:[6,21],rais:[16,24],ran:16,randolph:15,random:13,rang:[14,18],rank:[8,16,24,27],rapid:10,rate:[14,15,16,18,21,23],rate_limit_statu:18,rather:21,raw:11,rc2:7,re:[6,18,21],reachabl:16,read:[6,10,20],read_csv:6,read_json:[7,13,16],read_parquet:10,readabl:[11,13,16,27],reader:10,readi:[9,18],readm:16,readthedoc:[7,16,18],real:[6,18],realiti:13,realli:[7,9,10,16,21],reason:[4,6,7,10,13,16,24],receiv:[13,18],recent:[1,18,23],recip:[0,3,16,24,25],recommend:[6,10,16,18],recordingdetail:23,recurs:[7,15,16,24],red:[14,20],redirect:[10,16,24,27],redirect_from:10,redirect_reason:[7,16],redirect_tim:[7,16],redirect_to:10,redirect_ttl:[7,16],redirect_url:[7,16],redistrict:6,refer:[7,8,10,14,16,18,20],referer_:10,referer_dir_1:10,referer_dir_2:10,referer_dir_3:10,referer_frag:10,referer_hostnam:10,referer_last_dir:10,referer_netloc:10,referer_path:10,referer_port:10,referer_queri:10,referer_schem:10,referer_url:10,referer_url_df:10,referr:[7,19],referrerpolici:[16,24],reflect:24,regard:[16,21],regardless:[14,23],regex:[0,5,6,10,11,21,24,25,27],regex_raw:11,regga:23,region:[16,18,23],regioncod:[14,23],regular:[0,5,6,10,16,21,24,25,26],reilli:11,reinvent:15,rel:[4,8,12,13,16,20,24,27],rel_valu:[21,24],relat:[6,9,14,15,16,23,27],relatedsit:14,relatedtovideoid:[14,23],relayout:24,releas:24,relev:[9,14,18,19,23],relevancelanguag:[14,23],reli:16,reliabl:8,religion:23,remain:[2,15,22],remaind:[2,24],remark:16,rememb:16,remov:[14,16,18,21,22,23,24],renam:20,render:27,repeat:[6,20,24],repetit:6,replac:[1,10,15,20
,24,27],repli:[18,23],repons:[24,27],report:[7,12,16,20,21,24,27],repres:[6,8,10,14,15,18],represent:18,request:[0,3,7,8,10,12,14,16,18,23,24,25,27],request_:10,request_dir_10:10,request_dir_11:10,request_dir_12:10,request_dir_13:10,request_dir_1:10,request_dir_2:10,request_dir_3:10,request_dir_4:10,request_dir_5:10,request_dir_6:10,request_dir_7:10,request_dir_8:10,request_dir_9:10,request_frag:10,request_headers_:16,request_headers_accept:[7,16],request_headers_cooki:16,request_headers_us:[7,16],request_hostnam:10,request_last_dir:10,request_netloc:10,request_path:10,request_port:10,request_queri:10,request_query_:10,request_query__:10,request_query_a:10,request_query_aam:10,request_query_abspath:10,request_query_act:10,request_query_adapt:10,request_query_ag:10,request_query_albid:10,request_query_cmd:10,request_query_cod:10,request_query_cont:10,request_query_control:10,request_query_cpabc_calendar_upd:10,request_query_curpath:10,request_query_currentset:10,request_query_dir:10,request_query_dn:10,request_query_email:10,request_query_fil:10,request_query_file_link:10,request_query_filenam:10,request_query_filepath:10,request_query_findcli:10,request_query_fn:10,request_query_folderid:10,request_query_format:10,request_query_funct:10,request_query_gid:10,request_query_id:10,request_query_img:10,request_query_index:10,request_query_input_fil:10,request_query_item:10,request_query_itemid:10,request_query_lang:10,request_query_libpath:10,request_query_mod:10,request_query_mypath:10,request_query_nam:10,request_query_next_fil:10,request_query_nocontinu:10,request_query_op:10,request_query_opt:10,request_query_ord:10,request_query_p:10,request_query_pag:10,request_query_panel:10,request_query_path:10,request_query_posit:10,request_query_psd:10,request_query_q:10,request_query_redirect:10,request_query_ref:10,request_query_rid:10,request_query_sb_categori:10,request_query_scopenam:10,request_query_search_kei:10,request_query_servic:10,request_query_short:10,request_que
ry_sit:10,request_query_srt:10,request_query_step:10,request_query_stockcodeintern:10,request_query_target:10,request_query_term:10,request_query_thumb:10,request_query_titl:10,request_query_todo:10,request_query_typ:10,request_query_typeid:10,request_query_url:10,request_query_usernam:10,request_query_v:10,request_query_var:10,request_query_wt:10,request_query_xdebug_session_start:10,request_schem:10,request_url:10,request_url_df:10,requir:[10,14,15,16,18,19,23],rerun:4,resampl:15,research:[9,13,27],resolut:[14,23],resourc:[10,14,16,18,23,27],resourceid:23,resp_headers_:16,resp_headers_access:16,resp_headers_ag:[7,16],resp_headers_alt:7,resp_headers_cach:[7,16],resp_headers_cf:[7,16],resp_headers_cont:[7,16],resp_headers_d:[7,16],resp_headers_etag:7,resp_headers_expect:[7,16],resp_headers_expir:[7,16],resp_headers_last:[7,16],resp_headers_permiss:7,resp_headers_referr:7,resp_headers_serv:[7,16],resp_headers_strict:[7,16],resp_headers_vari:[7,16],resp_headers_via:7,resp_headers_x:[7,16],resp_meta_:24,respect:[2,4,10,16,18,21,24],respons:[0,8,10,13,14,15,16,18,23,24,25,26,27],rest:[6,8,13],restaur:6,restrict:[2,8,14,16,18,23,24],result:[0,1,4,5,10,13,15,16,18,20,21,23,24,25,26,27],result_typ:18,resultscor:8,resum:[0,3,25,27],retain:[9,20],retreiv:[4,15,24],retriev:[14,15,18,23],returnd:24,retweet:[18,21],retweeted_of_m:18,retweets_of_m:18,reus:[14,23],reveal:15,revenu:21,revers:[0,10,14,18,23,24,25,26],reverse_dns_lookup:[10,12,24,27],review:[10,14,15,23],rewrit:24,rfc:[14,23],rhythm:23,rich:[15,18],richer:16,right:[9,10,14,15,20],right_char:6,rio:9,risk:15,rm_word:21,rn:15,rnkt7myjj7hcnsvbnzg9qdqizefftx9ytz3:7,robot:[0,3,10,15,16,24,25,26,27],robots_output_fil:13,robots_url:13,robotsfiles_df:13,robotstxt:24,robotstxt_df:13,robotstxt_last_modifi:[13,24],robotstxt_obei:[4,7],robotstxt_test:[13,24],robotstxt_test_df:13,robotstxt_to_df:[13,24],robotstxt_url:13,robotx:13,rock:23,rogen:15,role:[20,23],rolling_new:15,romanian:[14,17,24],root:18,row:[9,10,13,14,15,21],rsvp:
6,rtd:[7,16],rtl:6,rule:[0,3,7,10,13,16,20,25,27],run:[0,4,5,8,9,12,13,14,15,16,18,20,21,24,25,26,27],russia:15,russian:[14,15,17,24],s22:15,s:[0,1,2,4,6,7,9,10,13,14,15,16,18,20,21,23,24,25,26,27],safari:10,safe:[14,18],safesearch:[14,23],safeti:14,safetycheck:13,sai:[6,9,14,16,21,27],said:[6,13],sail:[14,23],sale:21,same:[0,1,2,3,5,6,8,9,10,13,14,15,16,18,20,21,23,24,25,27],sampl:[5,8,15,16],sample_log:10,samsung:15,sara:15,satisfi:10,save:[0,3,7,10,13,16,24,25,27],saver:6,scale:[0,12,24,25,26],scari:18,scenario:2,schauspielerin:8,schema:8,scheme:[15,20],scienc:[15,27],scientist:27,score:[8,21],scrape:[0,3,10,16,24,25],scraper:10,scrapi:[7,16,27],screen:18,screen_nam:18,script:[4,7],script_src:4,sd:[14,23],seahawk:15,search:[0,7,8,13,15,18,19,20,23,24,25,26,27],search_us:18,searchterm:23,searchtyp:14,seattl:15,sec:16,second:[2,4,6,8,9,14,16,20,24,27],section:[13,14,23],secur:[7,16],see:[2,4,5,6,8,12,13,14,15,16,18,20,21,22,23],seem:[15,16,21],seen:10,segment:[9,18],selecotr:16,select:[10,14,16,18,23],selector:[0,24,25,26,27],selector_1:16,selector_2:16,self:20,sell:[9,15],sem:[0,16,24,26],sem_campaign:9,semi:18,semrush:27,senat:15,senatewinn:15,send:[8,10,18,27],sendfil:[7,16],sens:[20,21],sensit:[4,9,18],sent:[14,18,23],sentenc:[6,21],seo:[0,3,8,9,13,15,21,24,26],seop:8,seoul:8,sep:[2,24],separ:[2,6,10,14,16,18,20,23,24],sequenc:21,serbian:14,seri:15,seriou:21,serp:[0,8,20,24,25,26,27],serp_:[14,27],serp_goog:[14,16,24,27],serp_youtub:[14,24],serv:[7,16],server:[0,3,7,10,12,14,16,23,25],servic:[5,8,9,14,15],session:[10,14,18],set:[0,2,3,7,8,9,10,14,15,18,20,21,22,23,24,25,26,27],set_auth_param:18,set_index:15,set_logging_level:14,seth:15,setup:[0,24,25,26],sever:[0,4,7,10,14,18,21,23,24,25,26,27],seznambot:13,shape:[6,10,15],share:[11,16,21],shatel:12,she:[6,21],sheet:[24,27],shift:9,shoe:[16,21],shop:[2,16],shorter:[2,23,24],should:[1,4,6,7,8,13,14,16,18,21,23],shouldn:[9,10],shout:6,show:[5,6,8,9,10,14,16,20,21,23,24],show_list:18,show_owned_list:18,shown:[8,20
],si:15,side:[6,10,21,22],sidebar:[16,24],sidebar_link:16,sidebar_links_url:16,sign:[6,13,16,20,22],signatur:18,signifi:9,similar:[1,6,16,20,23,24],similarli:[14,16,23],simpl:[4,5,6,7,12,15,16,18,21,27],simpler:24,simplest:[16,20],simpli:[4,9,10,12,13,15,16,21],simplifi:[7,14,23],simul:23,simultan:16,sinc:[1,2,6,7,15,16,18,21],since_id:18,sine:7,singapor:1,singl:[10,13,14,16,18],singular:6,sinhala:[17,24],site:[4,9,13,14,15,16,20,21,23,24,27],site_crawl:16,site_scraping_tos_term:13,sitemap:[0,13,16,20,24,25,26,27],sitemap_df:15,sitemap_download:24,sitemap_last_modifi:[15,24],sitemap_size_mb:[15,24],sitemap_to_df:[15,16,24],sitemap_url:15,sitemapindex:24,sitename_crawl_yyyy_mm_dd:16,sitesearch:14,sitesearchfilt:14,sitmeapindex:15,situat:20,sivasubramanian:15,six:[2,21],sixti:21,size:[7,10,13,14,15,16,18,20,24],skateboard:15,skin:5,skip:[16,24],skip_statu:18,skip_url_param:24,slectorgadget:16,slice:18,slight:24,slot:[1,2,24,27],slovak:14,slovenia:5,slovenian:14,slow:[0,3,25],slug:[15,18,20],slurp:13,sm:20,small:[5,13,14,23],smaller:[15,23,24],smartphon:[10,15],smile:5,smilei:[5,6],snippet:[14,16,23,24],snow:[6,21],so:[0,2,3,6,7,8,9,10,13,14,15,16,18,20,21,23,25,27],social:[5,6,16,17,20,21],societi:23,softwareappl:8,solut:4,some:[4,5,6,7,10,12,13,14,15,16,18,20,21,23,24,27],somehow:21,someon:21,someth:[1,2,21],sometim:[2,4,9,13,16,21,27],somewher:[21,27],soon:13,sophist:27,sort:[14,17,20,21,23,24],soul:23,sound:6,sourc:[1,2,5,6,7,8,9,10,12,13,14,15,16,18,19,20,21,22,23],source_fil:10,south:8,space:[2,14,15,18,22],spaci:[17,24],spam:23,span:[16,24],spanish:[6,14,17,24],speak:14,special:[6,15,16,20,24,27],specif:[7,14,18,23,27],specifi:[0,2,3,6,8,10,13,14,16,18,22,23,24,25,27],speed:[7,16,24],spend:[6,18,27],spent:27,spider:[0,4,7,10,24,25,26,27],split:[0,2,10,15,16,21,22,24,25,26,27],sport:[5,15,23],spread:27,squar:5,square_bann:19,src:[4,16,24],srcset:[16,24],ss:23,stage:10,standard:[14,16,18,20,23,27],star:[1,15],start:[2,4,6,7,9,10,14,15,16,18,21,23,24,27],start_requ
est:7,starting_out:18,stat:[4,5,6,24],state:[8,14,15,20,23],static01:15,statist:[5,6,12,23,24,27],statu:[0,5,10,16,18,23,24,25,26,27],status:18,stdout:10,stearn:15,step:[8,22],still:[2,6,14,15,18,21,23],stiller:15,stitch:27,stop:[0,3,16,21,24,25,27],stopword:[0,21,24,25,26,27],storag:[10,15],store:[10,16],str:[1,2,5,6,7,9,10,13,15,16,18,19,21],straight:7,straightforward:[6,16,20],strateg:[15,27],strategi:[0,3,7,9,13,15,16,23,25],stream:18,strict:[14,23],stricter:24,string:[1,2,5,6,8,9,11,14,18,19,22,23,24],stringify_id:18,strip:[18,21,22],strongli:[16,18],structur:[0,4,7,9,15,18,24,25,26,27],stuff:[2,27],style:[13,16,24],stylesheet:4,sub:[0,3,5,6,10,13,15,16,18,20,24,25,27],sub_group:5,subdomain:[7,16],submodul:[16,24,25,26],subpackag:[24,25,26],subscrib:[18,23],subscribersnippet:23,subscript:[18,23],subscription_order_relev:23,subscriptions_list:23,subsequ:[14,23],subset:15,substr:8,suchmaschinenmarket:8,suchmaschinenoptimierung:8,sugar:6,suggest:[4,20,23],suit:10,suitabl:8,sulli:8,summar:[5,6,10],summari:[5,6,24],summer_promo:19,superhero:18,suppli:[12,14,24],support:[0,7,13,14,16,18,23,24,25,26,27],suppos:[13,20],sure:[0,1,2,3,6,7,12,14,16,18,20,24,25],surround:[6,24],surrounding_text:6,survei:14,susan:15,suspend:18,svc:7,swami:15,swedish:[14,17,24],sweet:6,sy:10,sym:6,symbol:[5,6,24],syndic:[14,23],system:[10,24],sytem:20,sz:23,t:[0,1,3,6,7,9,10,14,16,20,21,22,24,25,27],tabl:[8,9,16,27],tablet:15,tackl:27,tag:[4,7,13,14,15,16,23,24,27],tagalog:[17,24],tail:9,take:[2,4,6,8,9,10,13,15,16,18,20,21,24,27],talk:2,tamil:[17,24],target:[9,23],task:[7,9,21,22,27],tatar:[17,24],tc2:15,tea:6,teach:15,teal:14,team:15,technic:[8,27],techniqu:[4,21,27],technolog:[8,23],tediou:[9,20],telegrambot:13,tell:16,telugu:[17,24],templat:[1,2,15],temporari:10,ten:[14,21],tenni:23,teoma:13,term:[14,16,19,23,27],test:[0,5,24,25,26],tester:[0,24,25,26],text:[0,1,4,7,10,16,17,18,22,23,24,26],text_ad:2,text_list2:21,text_list:[5,6,21,22],textformat:23,textual:[5,6],thai:[17,24],than:[1,2,1
3,14,16,18,21,23,24,27],thei:[4,6,10,12,13,14,15,16,18,20,21,22,23,24],them:[0,2,3,6,7,9,10,12,13,15,16,18,20,21,24,25,27],themselv:[21,24],thenc:21,theoffic:6,thereaft:21,therebi:[21,23],therefor:[4,14,21,23],therein:21,thereupon:21,thi:[1,2,4,6,7,8,9,10,12,13,14,15,16,18,20,21,22,23,24,25,27],thing:[1,2,6,8,9,15,16,20,22,25,27],think:[6,16,20],third:[16,18,21],those:[0,2,3,7,8,9,10,12,13,14,15,16,20,21,23,24,25,27],though:[13,14,16,18,21,23],thought:8,thousand:[4,5,7,12,21,27],thread:[15,23,24],three:[1,4,6,15,16,18,20,21,24,27],through:[4,7,10,13,14,15,16,18,21,22,23,27],throughout:21,thru:21,thu:[7,16,21],ticket:14,tiktok:6,time:[1,2,4,5,6,7,8,9,10,12,13,14,15,16,18,21,23,24,27],timecr:23,timelin:18,timeout:24,timestamp:10,tini:13,tip:7,titl:[4,6,9,14,16,20,21,23,24,27],tl:10,tld:[14,24],to_datetim:10,to_parquet:10,toctre:16,todai:[1,5,6],togeth:[5,6,10,13,18,20,21,27],token:[0,21,24,25,26],token_typ:18,tokyo:1,tolist:[13,15],tommi:15,tone:5,too:[0,3,6,16,21,25,27],took:16,tool:[0,7,10,14,15,16,20],top:[0,5,6,8,9,10,12,14,15,16,18,20,21,23,24,25,26,27],top_bot:10,top_currency_symbol:6,top_domain:6,top_emoji:[5,6],top_emoji_categori:24,top_emoji_group:[5,6],top_emoji_sub_categori:24,top_emoji_sub_group:[5,6],top_emoji_text:[5,6],top_exclamation_mark:6,top_hashtag:6,top_ment:6,top_numb:6,top_question_mark:6,top_tld:6,top_url:6,top_word:6,topic1:20,topic2:20,topic:[14,15,18,20,23,24],topic_1:20,topic_2:20,topicdetail:23,topicid:[14,23],tor:10,total:[2,10,13,21],tourism:23,toward:[18,21],town:24,toyota:[1,9],traceback:1,track:[23,24,27],tracker:15,tradit:[14,23],traffic:[16,18,19],trail:22,train:6,transport:[7,15,16],travel:[5,6],trend:[18,21,27],tricki:16,trigger:4,trim:22,trim_us:18,trip:9,truestatus:18,truncat:16,tuesdai:6,turkc:15,turkish:[14,17,24,27],turn:14,tutor:9,tutori:[9,16,27],tv:[15,23],tw:14,tweet:[6,17,18,21,27],tweet_:18,tweet_mod:18,tweet_text:6,twelv:21,twenti:[9,13,21],twice:[0,3,21,24,25],twimg:18,twitter:[0,4,6,7,13,16,19,24,25,26,27],twitterbot
:[10,13],two:[1,2,4,6,9,11,13,14,16,20,21,23,24,27],twtr_content:4,twtr_name:4,twython:[18,24],txt:[0,3,5,10,15,16,24,25,26,27],type:[4,6,7,8,9,10,14,16,18,20,23,24,27],typic:[1,2,6,7,10,12,14,15,16,18,20,21,23,27],u5vdyevvf:6,ua:10,ua_:10,ua_devic:10,ua_df:10,ua_famili:10,ua_major:10,ua_minor:10,ua_o:10,ua_pars:10,ua_patch:10,ua_str:10,ubuntu:7,ug:17,uk:14,ukchina:15,ukrainian:[17,24],ultra:15,unalign:20,und:10,under:[4,7,8,10,13,21,24],underscor:15,understand:[8,9,13,14,15,18,20,27],understood:8,unexpect:16,unicod:[5,11],unifi:24,uniqu:[23,24],unique_currency_symbol:6,unique_emoji:[5,6],unique_exclamation_mark:6,unique_hashtag:6,unique_ment:6,unique_numb:6,unique_question_mark:6,unique_url:6,unique_word:6,unit:[14,15,18,23],unknown:[10,12],unless:[13,21],unlik:20,unlock:16,unnest:18,unpack:15,unread:23,unsign:[14,23],unspecifi:14,until:[6,18,21],unusu:20,up:[2,7,8,9,14,16,18,20,21,24,27],upcom:[14,23,27],updat:[4,15,24],upload:[9,14,15,18,23],upon:21,urdu:[15,17,24],uri:[7,16],url:[0,2,4,6,7,8,10,11,13,14,15,18,21,23,24,25,26,27],url_:27,url_build:16,url_count:6,url_df:15,url_freq:6,url_list:[4,7,10,16],url_path:13,url_redirected_to:24,url_summari:6,url_to_df:[10,15,20,24,27],url_utm_ga:[19,24],urls_flat:6,urls_per_post:6,urls_to_test:13,urlth:14,urlyt:10,us:[0,1,4,5,6,7,9,10,11,12,13,14,15,16,17,18,20,21,23,24,25,26,27],usa:14,usag:[5,6,16,18,27],usd:6,usemap:[16,24],user:[0,3,6,9,10,12,14,16,18,23,24,25,26,27],user_:18,user_ag:[4,7,10,13,16],user_agent_pars:10,user_id:18,user_ment:18,user_timelin:18,userag:13,usernam:23,usual:[4,8,12,18,20,21],usuali:10,utc:15,utf:[7,18],util:[2,18],utm:[19,24],utm_campaign:19,utm_cont:19,utm_medium:19,utm_sourc:19,utm_term:19,v11:11,v13:[5,24],v1642801328:15,v1644335726:15,v1644381627:15,v1644418652:15,v1644595412:15,v1:8,v271:15,v274:15,v281:15,v282:15,v285:15,v286:15,v290:15,v2_0_0m1638886228:10,vacanc:9,valid:[6,14,18,19,23],valu:[2,4,7,8,10,14,15,16,18,20,21,23,24],value_count:[10,15],valueerror:[1,24],variabl:24,varieti:18
,variou:[5,6,7,15,21,24],ve:24,veget:5,vegetable_emoji:5,vegur:7,vehicl:23,venti:6,verb:9,veri:[1,4,7,8,9,10,12,13,15,16,18,20,21,24,27],verifi:[12,15],versatil:24,version:[7,10,16,24],via:[14,18,21,23],vibe:6,vid_id:14,video:[0,13,14,18,21,23,24,25,26,27],video_categories_list:23,video_content_loc:15,video_descript:15,video_dur:15,video_expiration_d:15,video_publication_d:15,video_thumbnail_loc:15,video_titl:15,videocapt:[14,23],videocategori:23,videocategoryid:[14,23],videocount:[14,23],videodefinit:[14,23],videodimens:[14,23],videodur:[14,23],videoembedd:[14,23],videoid:23,videolicens:[14,23],videos_list:23,videosynd:[14,23],videotyp:[14,23],vietnames:[15,17,24],view:[8,14,18,21,23],viewcount:[14,23],viewer:[14,23],viewport:[4,16,24],vine:18,violat:23,virginia:15,visit:6,visual:27,vmi660635:10,volleybal:23,von:8,vp:15,vs:[0,15,25],w3c:16,w:[7,14,15],w_320:15,wa:[4,5,6,10,13,15,16,18,21,24],wai:[2,4,6,7,10,15,16,18,20,24,27],wait:[4,16],walk:15,wall:10,want:[0,1,2,3,5,6,7,8,9,10,12,13,14,15,16,18,20,21,22,23,25,27],warn:14,watch:[1,15,18],water:6,we:[2,6,8,9,10,13,15,16,20,21,27],web000079:16,web00007a:16,web00007c:16,web00007g:16,web00007h:16,web00007k:16,web:[7,8,14,15,16,17],webpag:[14,23],websit:[0,3,8,10,13,14,15,16,23,24,25,27],website_name_crawl_1:4,website_name_crawl_2:4,wed:16,week:[14,15,18,27],weight:[0,24,25,26,27],well:[6,7,9,10,12,13,14,15,16,18,20,21,22,23,24,27],went:10,were:[10,14,15,18,21,23,24],weren:10,west:15,what:[2,4,5,6,7,8,9,10,12,13,15,16,18,20,21,27],whatev:[21,27],when:[1,4,6,7,8,10,13,14,15,16,18,21,23,24,27],whenc:21,whenev:21,where:[2,4,6,7,10,14,15,16,18,20,21,24,27],wherea:21,whereaft:21,wherebi:21,wherein:21,whereupon:21,wherev:21,whether:[1,2,4,6,8,9,10,13,14,15,16,18,20,21,23,24],which:[2,4,6,7,8,10,13,14,15,16,17,18,20,21,22,23,24,27],whichev:[16,20,24],white:[6,14,22],whitespac:[2,21,22,24],whither:21,who:[4,6,13,14,15,18,21,23],whoever:21,whole:[5,7,16,21],whom:[18,21],whose:[14,21],why:[4,10,13,21],width:[16,23,24],wilson:15
,win64:10,win:[15,21],window:[10,16],wire:15,wired_autocomplet:15,wired_first:15,wired_reinv:15,wired_seth:15,wired_video:15,wired_wir:15,within:[1,2,9,14,16,18,21,22,23],without:[4,7,14,16,21,23,24,27],woeid:18,won:[4,6,27],word:[0,1,2,5,6,8,9,10,14,15,18,24,25,26,27],word_count:6,word_freq:6,word_frequ:[21,22,24,27],word_summari:6,word_token:[22,24],words_flat:6,words_per_post:6,words_to_extract:6,words_to_find:6,work:[4,6,8,9,10,13,16,18,21,23,27],worker:[12,15],world:15,worldnew:15,worri:[4,13],worth:5,would:[2,4,6,10,13,14,15,16,18,20,21,23],wrangl:27,wrap:24,wrestl:23,write:2,written:[6,13,14,15],wrong:[10,13],wtd_freq:[21,24],wtd_freq_perc:21,wtd_freq_perc_cum:21,www:[5,6,7,10,13,15],x11:10,x64:10,x86_64:10,x:[8,9,10,14,15,16,27],xhtml:[7,16],xlarg:14,xm:16,xml:[0,7,13,20,24,25,26,27],xpath:[0,3,24,25,26,27],xpath_selector:[16,24],xxlarg:14,y:[10,14],yahoo:18,yandex:13,yandexbot:10,ye:[7,8],yea:8,year:[14,15,18],yellow:[5,14],yet:[9,16,20,21],yeti:13,york:15,you:[1,2,4,5,6,7,8,9,10,12,13,14,15,16,17,18,20,21,22,23,25,27],your:[2,4,5,6,7,8,9,10,12,13,14,16,18,19,20,21,23,25],your_app_kei:18,your_app_secret:18,your_cx:14,your_google_developer_kei:8,your_kei:14,your_oauth_token:18,your_oauth_token_secret:18,your_user_ag:4,yourself:[16,21],yourselv:21,yout:20,youtub:[0,8,21,24,25,26,27],youtube_channel_detail:14,youtube_video_detail:14,youuuuuu:6,youuuuuuu:6,yymmdd_article_titl:15,yyyi:[15,18,23],z:10,zero:[8,14,16,23],zgrab:10,zh:[14,23],ziggozakelijk:10,zip:[6,10,24],zo0cnvuigj:6,zs:15},titles:["advertools package","Create Ads on a Large Scale","Create Ads Using Long Descriptive Text (top-down approach)","advertools.code_recipes package","\ud83d\udd77 SEO Crawling & Scraping: Strategies & Recipes","Emoji: Extract, Analyze, and Get Insights","Extract structured entities from text lists","\ud83d\udd77 Python Status Code Checker with Response Headers","Import and Analyze Knowledge Graph Results on a Large Scale","Generate Keywords for SEM Campaigns","Log File 
Analysis","Regular Expressions for Extracting Structured Entities","Reverse DNS Lookup in Bulk","\ud83e\udd16 Analyze and Test robots.txt Files on a Large Scale","Import Search Engine Results Pages (SERPs) for Google and YouTube","Download, Parse, and Analyze XML Sitemaps","\ud83d\udd77 Python SEO Crawler / Spider","Stopwords in Several Languages","Twitter Data API","URL Builders","Split, Parse, and Analyze URL Structure","Text Analysis","Tokenize Words (N-grams)","YouTube Data API","advertools","advertools","advertools","advertools: productivity & analysis tools to scale your online marketing"],titleterms:{"0":24,"01":24,"02":24,"03":24,"04":24,"05":24,"06":24,"07":24,"08":24,"09":24,"1":24,"10":24,"11":24,"12":24,"1234567890\u0660\u0661\u0662\u0663\u0664\u0665\u0666\u0667\u0668\u0669\u32ba\ud804\udc5b\ud800\udd0d\ud802\udcaa\u24f2\ud804\udc63\ud800\udd28\ud802\udd1b":6,"13":24,"14":24,"17":24,"18":24,"19":24,"2":24,"2018":24,"2019":24,"2020":24,"2021":24,"2022":24,"21":24,"23":24,"25":24,"26":24,"27":24,"29":24,"3":24,"30":24,"31":24,"4":24,"5":24,"6":24,"7":24,"8":24,"9":24,"\u0294":6,"do":4,"function":[6,10,16,18],"import":[8,14],"long":2,"new":[15,16],"while":[4,16],On:16,The:20,absolut:21,account:8,ad:[1,2],addit:16,advertool:[0,3,24,25,26,27],agent:[4,13],analysi:[10,21,25,27],analyt:16,analyz:[5,8,10,13,15,20],api:[8,18,23],approach:[2,13,16],articl:[2,16],audit:4,authent:18,automat:4,base:4,behavior:16,builder:19,bulk:[12,13],campaign:[9,27],can:4,certain:4,chang:[24,25],checker:7,code:7,code_recip:3,concurr:4,condit:4,consol:16,content:[0,3,25,27],control:4,convent:27,copi:4,count:21,crawl:[4,10,16],crawler:16,creat:[1,2],css:16,currenc:6,custom:[4,16],data:[10,16,18,23],datafram:10,depth:4,descript:2,determin:16,di:4,directori:20,discoveri:16,dn:12,domain:4,don:4,down:[2,4],download:15,element:16,emoji:[5,6],engin:14,entiti:[6,11],exclam:6,express:[4,11],extract:[4,5,6,11,16],facebook:2,feed:2,file:[10,13],follow:[4,16],format:10,frequenc:21,from:[4,5,6],
gener:9,get:5,googl:[2,8,14,16],gram:22,graph:8,hard:4,hashtag:6,header:7,hit:4,how:[4,8,10],i:4,includ:4,index:[15,25],indic:25,insight:5,instal:27,instant:2,its:4,job:4,keyword:9,knowledg:8,languag:17,larg:[1,8,13],later:4,link:[4,16],list:[4,6,16],log:[4,10,24,25],logs_to_df:10,lookup:12,make:4,market:[25,27],media:[25,27],mention:6,mode:[4,16],modul:[0,3],multipl:4,my:4,n:22,number:[4,6],obei:4,onli:4,onlin:[25,27],packag:[0,3],page:[4,14,16],paramet:[16,20],pars:[10,15,20],path:20,pattern:16,paus:4,pre:16,prepar:10,product:[25,27],python:[7,16],queri:[16,20],question:6,recip:4,regex:16,regular:[11,15],request:4,respons:7,result:[8,14],resum:4,revers:12,robot:[4,13],rule:4,run:10,s:8,same:4,save:4,scale:[1,8,13,27],scrape:4,search:[5,14,16],selector:16,sem:[9,25,27],seo:[4,16,25,27],serp:[14,16],server:4,set:[4,16],setup:8,sever:17,sitemap:15,slow:4,so:4,social:[25,27],specifi:4,spider:16,split:20,statu:7,stop:4,stopword:17,strategi:4,structur:[6,11,20],sub:4,submodul:[0,3],subpackag:0,support:10,sure:4,t:4,tabl:25,test:13,tester:13,text:[2,5,6,21,25,27],them:4,those:4,token:22,too:4,tool:[25,27],top:2,twice:4,twitter:18,txt:[4,13],url:[16,19,20],us:[2,8],user:[4,13],video:15,vs:21,want:4,websit:4,weight:21,word:[21,22],xml:15,xpath:[4,16],your:27,youtub:[14,23]}}) \ No newline at end of file diff --git a/docs/conf.py b/docs/conf.py index 2c45aa0b..32c1cae4 100644 --- a/docs/conf.py +++ b/docs/conf.py @@ -23,7 +23,7 @@ # -- Project information ----------------------------------------------------- project = 'advertools' -copyright = '2021, Elias Dabbas' +copyright = '2022, Elias Dabbas' author = 'Elias Dabbas' # The short X.Y version @@ -74,8 +74,8 @@ # directories to ignore when looking for source files. # This pattern also affects html_static_path and html_extra_path . exclude_patterns = [ -# '_build', - 'Thumbs.db', +# '_build', + 'Thumbs.db', '.DS_Store', ]