-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathBYUWebAuto.py
211 lines (169 loc) · 7.81 KB
/
BYUWebAuto.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
import os
import zipfile
from datetime import datetime
from titlecase import titlecase
from tkinter import *
def GetFileName(slug): # this takes a slug and returns the filename, capitalization doesn't matter
setups = os.listdir('//Users/scot/Box/BYU Radio/Top of Mind/2020 Setup Sheets/')
setupsLower = [x.lower() for x in setups] # makes all titles in listdir lowercase for cap-free searching
fileName = str([s for s in setupsLower if slug.lower() in s])
if len(fileName) == 2:
setupSheet = "NO FILE FOUND WITH \"" + slug + "\" IN NAME"
elif fileName.count(".docx") > 1:
setupSheet = "MORE THAN ONE POSSIBLE FILE: " + fileName
else:
cleanName = setupsLower.index(fileName[2:len(fileName) - 2])
setupSheet = setups[cleanName] # returns properly capitalized filename based on index
return setupSheet
def CleanWord(fileSlug):
fileName = GetFileName(fileSlug)
doc = zipfile.ZipFile('//Users/scot/Box/BYU Radio/Top of Mind/2020 Setup Sheets/' + fileName)
content = doc.read('word/document.xml').decode(
'utf-8') # .decode() turns type bytes into string for easy manipulation
cleaned = re.sub('<(.|\n)*?>', '', content)
return cleaned
def GetHeadline(cleaned):
# get headline
headline = cleaned[cleaned.find("HEADLINE: ") + len("HEADLINE: "):cleaned.find("SEGMENT")]
return headline
def GetGuest(cleaned):
# get name and title of guest--should be reviewed for proper formatting
nameAndTitle = "Name and Title of Guest(s): "
if cleaned.find(
"Pronunciation:") != -1: # if "Pronunciation has been deleted, the string will stop at "Pre-Record:"
guest = cleaned[cleaned.find(nameAndTitle) + len(nameAndTitle):cleaned.find("Pronunciation:")]
elif cleaned.find("Pre-Record") != -1:
guest = cleaned[cleaned.find(nameAndTitle) + len(nameAndTitle):cleaned.find("Pre-Record:")]
else:
guest = cleaned[cleaned.find(nameAndTitle) + len(nameAndTitle):cleaned.find("FOR AIR:")]
return guest
def GetIntroCopy(cleaned):
# gets intro, goes until it sees "QUESTIONS:" or "OUTRO COPY", whichever comes first
indexIntroCopyLeft = ""
if cleaned.find("OUT CUE: I’m Julie Rose. ") != -1:
introCopy = "OUT CUE: I’m Julie Rose. "
indexIntroCopyLeft = cleaned.find(introCopy) + len(introCopy)
elif cleaned.find("INTRO COPY (LIVE-READ, WRITTEN-TO-SOUND). ") != -1:
introCopy = "INTRO COPY (LIVE-READ, WRITTEN-TO-SOUND). "
indexIntroCopyLeft = cleaned.find(introCopy) + len(introCopy)
elif cleaned.find("INTRO COPY (LIVE-READ, WRITTEN-TO-SOUND).") != -1:
introCopy = "INTRO COPY (LIVE-READ, WRITTEN-TO-SOUND)."
indexIntroCopyLeft = cleaned.find(introCopy) + len(introCopy)
elif cleaned.find("INTRO COPY") != -1:
introCopy = "INTRO COPY"
indexIntroCopyLeft = cleaned.find(introCopy) + len(introCopy)
intro = cleaned[indexIntroCopyLeft:len(cleaned)]
if intro.find("on the line") != -1:
intro = intro[0:intro.find("on the line")]
if intro.find("joins me now") != -1:
intro = intro[0:intro.find("joins me now")]
if intro.find("QUESTIONS:") != -1:
intro = intro[0:intro.find("QUESTIONS:")]
if intro.find("Welcome.") != -1:
intro = intro[0:intro.find("Welcome.")]
if intro.find("OUTRO COPY") != -1:
intro = intro[0:intro.find("OUTRO COPY")]
return intro
def ScrapeWord(fileSlug): # this goes into a word document and returns titlecase headline, guest info, and intro copy
cleaned = CleanWord(fileSlug)
headline = GetHeadline(cleaned)
guest = GetGuest(cleaned)
intro = GetIntroCopy(cleaned)
# if it's for Prime Cuts, this gives the original air date
if cleaned.find("PRIME CUTS") != -1: # GetFileName(fileSlug).find("PRIME CUTS") != -1: <- I might need this
forAir = cleaned[cleaned.find("FOR AIR") + len("FOR AIR: "):len(cleaned)]
origAired = "(Originally aired" + forAir[0:forAir.find("PRIME")] + ")"
else:
origAired = ""
# concatenate info, titlecase headline and guest
info = titlecase(headline) + "\n" + "Guest: " + titlecase(guest) + "\n" + intro + " " + origAired + "\n\n"
return info
def GiveEpisodeInfo(fileName): # returns titlecase headline, guest info, and intro copy from word
cleaned = CleanWord(fileName)
# get name and title of guest--should be reviewed for proper formatting
nameAndTitle = "Name and Title of Guest(s): "
if cleaned.find(
"Pronunciation:") != -1: # if "Pronunciation has been deleted, the string will stop at "Pre-Record:"
guest = cleaned[cleaned.find(nameAndTitle) + len(nameAndTitle):cleaned.find("Pronunciation:")]
else:
guest = cleaned[cleaned.find(nameAndTitle) + len(nameAndTitle):cleaned.find("Pre-Record:")]
info = guest[0:guest.find(",")] + " of " + guest[guest.find(","):len(guest)] + " on " + fileName.lower() + "."
return info
# Work below here, may need some functions above
def ListSlugs(): # TODO change this to adjust number of slugs, or don't get
slugs = [slug_entry_1.get(), slug_entry_2.get(), slug_entry_3.get(),
slug_entry_4.get(), slug_entry_5.get(), slug_entry_6.get()]
return slugs
def PrintSlugs():
slugs = ListSlugs()
j = 0
for i in slugs:
j += 1
if len(i) == 0:
Label(root, text="NO SLUG ENTERED").grid(row=j, column=3)
else:
Label(root, text=GetFileName(i)).grid(row=j, column=3)
create_txt_done.grid_forget()
def InsertTxt(webText): # this opens/creates a new .txt file, writes webText to it, closes .txt file
now = datetime.now()
today = now.strftime("%m-%d-%Y")
file = "//Users/scot/Desktop/Setups/WebsiteAuto/" + today + ".txt"
f = open(file, "w+")
f.write(webText)
f.close()
def EpInfo():
slugs = ListSlugs()
episodeInfo = ''
for i in slugs:
episodeInfo += GiveEpisodeInfo(GetFileName(i))
e = Entry(root)
e.grid(row=7, column=3)
e.insert(0, episodeInfo)
create_txt_done.grid_forget()
def CreateTxt():
slugs = ListSlugs()
text = ""
for x in slugs:
text += ScrapeWord(x)
InsertTxt(text)
create_txt_done.grid(row=8, column=1)
# print(ScrapeWord("")) you can use this for tests
root = Tk()
root.title("BYU Top of Mind Web Automated")
title = Label(root, text="BYU Web Automated", compound=CENTER)
show_name = Label(root, text="Top of Mind with Julie Rose", compound=CENTER)
slug_label_1 = Label(root, text="Enter Slug 1:")
slug_label_2 = Label(root, text="Enter Slug 2:")
slug_label_3 = Label(root, text="Enter Slug 3:")
slug_label_4 = Label(root, text="Enter Slug 4:")
slug_label_5 = Label(root, text="Enter Slug 5:")
slug_label_6 = Label(root, text="Enter Slug 6:")
slug_entry_1 = Entry(root)
slug_entry_2 = Entry(root)
slug_entry_3 = Entry(root)
slug_entry_4 = Entry(root)
slug_entry_5 = Entry(root)
slug_entry_6 = Entry(root)
get_filenames_button = Button(root, text="Check filenames", command=PrintSlugs)
create_txt = Button(root, text="Create .txt file", command=CreateTxt)
create_txt_done = Label(root, text="Done!")
get_ep_info = Button(root, text="Get Episode Info", command=EpInfo)
#TODO add a clear button to destroy the filename labels...or just clear them anytime you call Check filename
title.grid(row=0, column=0)
show_name.grid(row=0, column=1)
slug_label_1.grid(row=1, column=0)
slug_label_2.grid(row=2, column=0)
slug_label_3.grid(row=3, column=0)
slug_label_4.grid(row=4, column=0)
slug_label_5.grid(row=5, column=0)
slug_label_6.grid(row=6, column=0)
slug_entry_1.grid(row=1, column=1)
slug_entry_2.grid(row=2, column=1)
slug_entry_3.grid(row=3, column=1)
slug_entry_4.grid(row=4, column=1)
slug_entry_5.grid(row=5, column=1)
slug_entry_6.grid(row=6, column=1)
get_filenames_button.grid(row=7, column=0)
create_txt.grid(row=7, column=1)
get_ep_info.grid(row=7, column=2)
root.mainloop()