-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathemail_extractor.py
More file actions
147 lines (106 loc) · 4.49 KB
/
email_extractor.py
File metadata and controls
147 lines (106 loc) · 4.49 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
import tkinter as tk
from tkinter import *
from tkinter import ttk
from tkinter.scrolledtext import *
import re
# Patterns used by the extractor callbacks. They are compiled once at import
# time and applied with ``findall``, so none of them may contain a capturing
# group (``findall`` would then return the groups instead of the whole match).

# One or more word characters, dots or hyphens on each side of an "@".
email_regex = re.compile(r"[\w\.-]+@[\w\.-]+")

# Three, three and four digits joined by single separator characters. The
# separator is "anything except a digit or a newline": a bare ``.`` would also
# accept a digit and report any 12-digit run as a phone number.
phone_num_regex = re.compile(r"\d{3}[^\d\n]\d{3}[^\d\n]\d{4}")

# In both URL patterns "www." is optional as a unit (non-capturing group), so
# links with and without the prefix are found.
# HTTPS links only: the "s" is mandatory so this pattern does not overlap with
# the plain-HTTP one below.
url_regex_https = re.compile(r"https://(?:www\.)?\w+\.\w+")
# Plain HTTP links only: the scheme is spelled out in full, so neither
# "htt://" nor "https://" is accepted.
url_regex = re.compile(r"http://(?:www\.)?\w+\.\w+")
# Root window: fixed starting size, titled after the tool.
window = Tk()
window.title("Email & Phone Extractor")
window.geometry('700x500')

# Notebook with three pages; every page is a plain frame owned by the notebook.
tab_control = ttk.Notebook(window)
tab1, tab2, tab3 = (ttk.Frame(tab_control) for _ in range(3))
tab_control.add(tab1, text="Home")
tab_control.add(tab2, text="Url/Links Extract")
tab_control.add(tab3, text='About')
tab_control.pack(fill='both', expand=1)

# Heading label in the top-left grid cell of each page.
label1 = Label(tab1, text='Email & Phone Number Extractor', padx=5, pady=5)
label1.grid(row=0, column=0)

label2 = Label(tab2, text='Url Extractor', padx=5, pady=5)
label2.grid(row=0, column=0)

label3 = Label(tab3, text='About', padx=5, pady=5)
label3.grid(row=0, column=0)
# Clear entry widget
def clear_text():
    """Erase the whole contents of ``entry1``, the Home tab's input box."""
    entry1.delete("1.0", tk.END)
def clear_text_url():
    """Erase the whole contents of ``entry``, the URL tab's input box."""
    entry.delete("1.0", tk.END)
def clear_display_result():
    """Erase everything shown in ``tab1_display``, the Home tab's result box."""
    tab1_display.delete("1.0", tk.END)
def clear_display_result_url():
    """Erase everything shown in ``tab2_display``, the URL tab's result box."""
    tab2_display.delete("1.0", tk.END)
def extract_email():
    """Report the e-mail addresses found in the Home tab's input box.

    Reads all text from ``entry1``, collects every ``email_regex`` match and
    appends the match count plus the list of matches to ``tab1_display``.
    Earlier results are left in place; each call adds a new summary.
    """
    source_text = str(entry1.get("1.0", tk.END))
    matches = email_regex.findall(source_text)
    summary = '\nNumber of Emails:{},\nEmails:{}'.format(len(matches), matches)
    tab1_display.insert(tk.END, summary)
def extract_phonenumbers():
    """Report the phone numbers found in the Home tab's input box.

    Reads all text from ``entry1``, collects every ``phone_num_regex`` match
    and appends the match count plus the list of matches to ``tab1_display``.
    Earlier results are left in place; each call adds a new summary.
    """
    source_text = str(entry1.get("1.0", tk.END))
    matches = phone_num_regex.findall(source_text)
    summary = '\nPhone Number Count:{},\nPhone Numbers:{}'.format(len(matches), matches)
    tab1_display.insert(tk.END, summary)
def extract_http():
    """Report the links in the URL tab's input box that match ``url_regex``.

    Reads all text from ``entry``, collects every match and appends the match
    count plus the list of matches to ``tab2_display``. Earlier results are
    left in place; each call adds a new summary.
    """
    source_text = str(entry.get("1.0", tk.END))
    matches = url_regex.findall(source_text)
    summary = '\nURL Count:{},\nURL/HTTP:{}'.format(len(matches), matches)
    tab2_display.insert(tk.END, summary)
def extract_https():
    """Report the links in the URL tab's input box that match ``url_regex_https``.

    Reads all text from ``entry``, collects every match and appends the match
    count plus the list of matches to ``tab2_display``. Earlier results are
    left in place; each call adds a new summary.
    """
    source_text = str(entry.get("1.0", tk.END))
    matches = url_regex_https.findall(source_text)
    summary = '\nURL Count:{},\nURL/HTTP:{}'.format(len(matches), matches)
    tab2_display.insert(tk.END, summary)
# ---- Home tab: prompt, input box, action buttons, result box ----
l1 = Label(tab1, text="Enter Text To Extract")
l1.grid(column=0, row=1)

# Free-text input that the e-mail and phone extractors read from.
entry1 = ScrolledText(tab1, height=10)
entry1.grid(column=0, row=2, columnspan=2, padx=5, pady=5)

# Buttons sit in a 2x2 grid on rows 4-5: the left column clears things,
# the right column runs an extraction.
button_1 = Button(
    tab1, text="Reset", width=10, bg='#03A9F4', fg='#fff', command=clear_text
)
button_1.grid(column=0, row=4, padx=10, pady=10)

button_2 = Button(
    tab1, text="Email", width=10, bg='red', fg='#fff', command=extract_email
)
button_2.grid(column=1, row=4, padx=10, pady=10)

# The name ``button_2`` is reused here; the Email button stays alive because
# Tk keeps its own reference to every widget it displays.
button_2 = Button(
    tab1, text="Phone", width=10, bg='green', fg='#fff', command=extract_phonenumbers
)
button_2.grid(column=1, row=5, padx=10, pady=10)

button_3 = Button(
    tab1,
    text="Clear Result",
    width=10,
    bg='#03A9F4',
    fg='#fff',
    command=clear_display_result,
)
button_3.grid(column=0, row=5, padx=10, pady=10)

# Output area that the extract callbacks append their summaries to.
tab1_display = ScrolledText(tab1, height=10)
tab1_display.grid(column=0, row=7, columnspan=3, padx=5, pady=5)
# ---- URL tab: prompt, input box, action buttons, result box ----
l1 = Label(tab2, text="Enter Text To Extract Links")
l1.grid(column=0, row=1)

# Free-text input that the link extractors read from.
entry = ScrolledText(tab2, height=10)
entry.grid(column=0, row=2, columnspan=2, padx=5, pady=5)

# Buttons sit in a 2x2 grid on rows 4-5: the left column clears things,
# the right column runs an extraction.
button1 = Button(
    tab2, text="Reset", width=10, bg='#03A9F4', fg='#fff', command=clear_text_url
)
button1.grid(column=0, row=4, padx=10, pady=10)

button2 = Button(
    tab2, text="Extract HTTP", width=10, bg='red', fg='#fff', command=extract_http
)
button2.grid(column=1, row=4, padx=10, pady=10)

# The name ``button2`` is reused here; the HTTP button stays alive because
# Tk keeps its own reference to every widget it displays.
button2 = Button(
    tab2, text="Extract HTTPS", width=10, bg='blue', fg='#fff', command=extract_https
)
button2.grid(column=1, row=5, padx=10, pady=10)

button3 = Button(
    tab2,
    text="Clear Result",
    width=10,
    bg='#03A9F4',
    fg='#fff',
    command=clear_display_result_url,
)
button3.grid(column=0, row=5, padx=10, pady=10)

# Output area that the link-extract callbacks append their summaries to.
tab2_display = ScrolledText(tab2, height=10)
tab2_display.grid(column=0, row=7, columnspan=3, padx=5, pady=5)
# ---- About tab: version and credit line under the tab heading ----
about_label = Label(
    tab3,
    text="Email Extractor V.0.0.1 \n Jesus saves @JCharisTech",
    padx=5,
    pady=5,
)
about_label.grid(row=1, column=0)

# Enter Tk's event loop; this call blocks until the window is closed.
window.mainloop()