import json
import re
+import time

from examples.mockingbird.mockingbooks_py.entities import EntitiesFilter, search_entities
-
-# Path to the file
-file_path = 'tmp/tmp.txt'
-
-# Open the file and read its contents
-with open(file_path, 'r') as file:
-    text = file.read()
-
-# Define two patterns
-pattern1 = r'data-anonymize="person-name">\s*([^<]+?)\s*</a>'
-pattern2 = r'<span data-anonymize="company-name">\s*([^<]+?)\s*</span>'
+from examples.mockingbird.mockingbooks_py.google_search_regex.dynamic_google_search import start_wf

agg_prompt = ("Can you summarize the relevant person and/or associated business entity from the search results? It "
              "should use the most relevant search result that matches best and ignore others to prevent mixing"
              ...
              "with the metadata sources that are associated from that platform, business, ie. LinkedIn, Twitter, etc."
              "so that we associate the correct entity metadata with the correct platforms.")

-# Find all matches for both patterns
-matches1 = re.findall(pattern1, text)
-matches2 = re.findall(pattern2, text)

-# Check if lengths are equal
-if len(matches1) > len(matches2):
-    matches1, matches2 = matches2, matches1
+# Function to process each <li> element
+def process_li_element(li_text):
+    # Patterns for extracting the person's name and the company name
+    name_pattern = r'data-anonymize="person-name">\s*([^<]+?)\s*</span>'
+    # The company pattern skips any remaining tag attributes and stops capturing at the first '<'
+    company_pattern = r'data-anonymize="company-name"[^>]*>\s*([^<]+?)\s*<'
+
+    # Search for the name and company within the <li> element text
+    name_match = re.search(name_pattern, li_text)
+    company_match = re.search(company_pattern, li_text)
+
+    # Return both values only when the name and the company are found
+    if name_match and company_match:
+        return name_match.group(1), company_match.group(1)
+    else:
+        return None
+
+
+def iterate_on_matches():
+    # List to store all matches
+    all_matches = []
+    count = 0
+
+    # Process files from page1 to page60
+    for page_num in range(1, 61):
+        file_path = f'tmp/page{page_num}.txt'
+
+        # Open the file and read its HTML contents
+        with open(file_path, 'r') as file:
+            text = file.read()
+
+        # Regex pattern that captures each <li> element in the page
+        li_pattern = r'<li class="artdeco-list__item[^>]*>.*?</li>'
+
+        # Find all <li> elements
+        li_elements = re.findall(li_pattern, text, re.DOTALL)

-offset_l = 80
-offset_r = 100
+        # Process each <li> element to extract names and companies
+        matches = [process_li_element(li) for li in li_elements]

-# skip next
-# for i in range(len(matches1)):
-#     person_company = f"{i}:{matches1[i]} (company)"
-#     if 0 + offset_l < i < 1 + offset_r:
-#         print(person_company)
-#         start_wf(person_company, agg_prompt)
+        # Filter out any None results
+        matches = [match for match in matches if match is not None]

+        # Iterate and print each match
+        for name, company in matches:
+            count += 1

-# Example iteration and action simulation with 'start_wf' function.
-# Since the 'start_wf' function is a conceptual example, we'll simulate its operation as a print statement.
-# for person_company in formatted_people_companies:
-#     # Simulate calling 'start_wf' function with the person_company tuple and aggregated prompt.
-#     start_wf(person_company, agg_prompt)
-#
+            # Only dispatch entries once the running count passes 722
+            if count > 722:
+                nc = f'Name: {name}, Company: {company}'
+                print(nc)
+                start_wf(nc, agg_prompt)
+                all_matches += [(name, company)]
+                time.sleep(10)
+                print(count)

-# skip next

if __name__ == '__main__':
+    iterate_on_matches()
    search_entities_f = EntitiesFilter()

    pretty_data1 = search_entities(search_entities_f)
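
The two patterns in process_li_element are easy to sanity-check against a small hand-written fragment. The snippet below is a hypothetical stand-in for the saved markup in tmp/pageN.txt (the real pages are not shown in this diff), so the surrounding tags and attributes are assumptions; only the data-anonymize patterns mirror the committed code.

import re

# Hypothetical <li> fragment; the real saved pages may differ.
sample_li = (
    '<li class="artdeco-list__item pl3 pv3">'
    '<span data-anonymize="person-name"> Jane Doe </span>'
    '<a data-anonymize="company-name" href="#"> Acme Corp </a>'
    '</li>'
)

# Same patterns as in process_li_element
name_pattern = r'data-anonymize="person-name">\s*([^<]+?)\s*</span>'
company_pattern = r'data-anonymize="company-name"[^>]*>\s*([^<]+?)\s*<'

name_match = re.search(name_pattern, sample_li)
company_match = re.search(company_pattern, sample_li)

if name_match and company_match:
    # Prints: Jane Doe | Acme Corp
    print(name_match.group(1), '|', company_match.group(1))

Both patterns wrap the capture group in \s*, so the captured values come back without the padding whitespace inside the tags.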
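
iterate_on_matches leans on two small conventions: a running count that skips everything up to the hard-coded threshold of 722 (presumably so an interrupted run can pick up where it left off) and a time.sleep(10) between start_wf calls as a crude rate limit. Below is a minimal sketch of that resume-and-throttle pattern in isolation, using hypothetical items, a threshold of 2, and a 1-second delay in place of the committed values.

import time

def replay_with_resume(items, already_processed=2, delay_seconds=1):
    # Skip items handled in an earlier run, then throttle the rest.
    count = 0
    for name, company in items:
        count += 1
        if count <= already_processed:
            continue  # dispatched before the previous run stopped
        print(f'Name: {name}, Company: {company}')  # stands in for start_wf(nc, agg_prompt)
        time.sleep(delay_seconds)

replay_with_resume([('A', 'X'), ('B', 'Y'), ('C', 'Z'), ('D', 'W')])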