Deleted a bunch of files and cleaned things up. Started the script for finding correct domain names for Anthology. Recast templates. Todolist.
This commit is contained in:
BIN
Scripts/Anthology/__pycache__/domains_list.cpython-310.pyc
Normal file
BIN
Scripts/Anthology/__pycache__/domains_list.cpython-310.pyc
Normal file
Binary file not shown.
8
Scripts/Anthology/antho-map-domains-from-csv.py
Normal file
8
Scripts/Anthology/antho-map-domains-from-csv.py
Normal file
@ -0,0 +1,8 @@
|
||||
import pandas as pd
|
||||
import requests
|
||||
|
||||
# Path to the Anthology master CSV export in the user's Downloads folder.
MASTER = "~/Downloads/Anthology-Master-CSV-FirstChanges.csv"

# Load the entire sheet into a DataFrame.
df = pd.read_csv(MASTER)

# iterrows() yields (index, Series) pairs; print each pair as a tuple so the
# whole record can be inspected while the mapping logic is being developed.
for index, record in df.iterrows():
    print((index, record))
|
||||
26
Scripts/Anthology/antho_domains.py
Normal file
26
Scripts/Anthology/antho_domains.py
Normal file
@ -0,0 +1,26 @@
|
||||
import csv
|
||||
import pandas as pd
|
||||
|
||||
|
||||
def grab_vals(
    source="/Users/normrasmussen/Downloads/antho_domains.csv",
    destination="/Users/normrasmussen/Downloads/final_domains.csv",
):
    """Collect the unique non-empty cells of a CSV and save them as "@domain" rows.

    Every cell of every row in ``source`` is read; empty cells are dropped,
    duplicates are removed (first occurrence wins, so the order is stable from
    run to run), and each remaining value is prefixed with "@".  The result is
    written to ``destination`` through a single-column pandas DataFrame.

    The number of cells before and after de-duplication is printed.

    Args:
        source: Path of the CSV file to read.
        destination: Path of the CSV file to write.

    Returns:
        The list of "@"-prefixed values, in the order they were written.
    """
    cells = []
    # newline="" is what the csv module expects so that it can handle line
    # endings (including ones embedded in quoted fields) on its own.
    with open(source, "r", newline="") as handle:
        for row in csv.reader(handle):
            for cell in row:
                if cell != "":
                    cells.append(cell)

    print(len(cells))

    # dict.fromkeys removes duplicates while keeping first-seen order; a plain
    # set() would make the output order change between runs.
    unique_cells = list(dict.fromkeys(cells))
    print(len(unique_cells))

    final = ["@" + domain for domain in unique_cells]

    filecsv = pd.DataFrame(final)
    filecsv.to_csv(destination)
    return final


if __name__ == "__main__":
    grab_vals()
|
||||
4
Scripts/Anthology/anthology-parse-csv-test2.csv
Normal file
4
Scripts/Anthology/anthology-parse-csv-test2.csv
Normal file
@ -0,0 +1,4 @@
|
||||
domain, group_1, ,
|
||||
newanthology.com, Anthology 101 - (T1), Anthology 101 - (T2),
|
||||
sometest.com, Anthology 101 - (T1), Anthology 101 - (T4),
|
||||
tc.columbia.edu, Anthology 101 - (T2), ,
|
||||
|
1102
Scripts/Anthology/domains_list.py
Normal file
1102
Scripts/Anthology/domains_list.py
Normal file
File diff suppressed because it is too large
Load Diff
10
Scripts/Anthology/find_domain_names.py
Normal file
10
Scripts/Anthology/find_domain_names.py
Normal file
@ -0,0 +1,10 @@
|
||||
from requests_html import HTMLSession
|
||||
from domains_list import DOMAINS
|
||||
|
||||
import sys

# Seconds to wait for a host before giving up, so one dead domain cannot
# stall the whole run.
REQUEST_TIMEOUT_SECONDS = 10

# Print the group name (the part of the page <title> before the first "|")
# for every domain in DOMAINS.  A single session is shared by all requests
# and closed when the loop ends, instead of opening a new one per domain.
with HTMLSession() as session:
    for domain in DOMAINS:
        URL = f"https://{domain}"
        try:
            resp = session.get(URL, timeout=REQUEST_TIMEOUT_SECONDS)
        except OSError as err:
            # requests' RequestException derives from IOError (OSError), so
            # this covers DNS failures, refused connections and timeouts.
            print(f"{domain}: request failed ({err})", file=sys.stderr)
            continue

        title = resp.html.find('head > title', first=True)
        if title is None:
            # find(..., first=True) gives None when the page has no <title>.
            print(f"{domain}: no <title> found", file=sys.stderr)
            continue

        # Titles look like "Group Name | Site"; drop the padding around "|".
        group_name = title.text.split("|")[0].strip()
        print(group_name)
|
||||
8615
Scripts/Anthology/workato-antho-2.py
Normal file
8615
Scripts/Anthology/workato-antho-2.py
Normal file
File diff suppressed because it is too large
Load Diff
Reference in New Issue
Block a user