Skip to content

Commit 0a11188

Browse files
committed
untangle spaghetti
1 parent 857b8fd commit 0a11188

File tree

6 files changed

+873
-684
lines changed

6 files changed

+873
-684
lines changed

BROWSING_CATEGORIES.py

Lines changed: 188 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -0,0 +1,188 @@
# Site-categorisation table -- update this to include sites you want to track!
#
# Each top-level key is a category name mapping to a dict with three keys:
#   'domains'       - list of host names that belong to the category
#   'patterns'      - list of regular-expression fragments (raw strings)
#   'subcategories' - subcategory name -> list of entries from the category
#
# NOTE(review): the code that consumes this table is not visible here, so the
# exact matching rules (exact host vs. suffix vs. substring, regex search vs.
# match, category precedence) should be confirmed against the caller.
# NOTE(review): a few 'subcategories' entries are regex fragments
# (r'\.fandom\.com', r'docs\.', r'\.edu/') or contain a path
# ('reddit.com/r/news') rather than being plain host names -- verify that the
# consumer handles both forms.
# NOTE(review): some hosts overlap across categories (e.g. 'google.com' in
# 'reference' vs. 'maps.google.com', 'scholar.google.com',
# 'calendar.google.com' elsewhere) -- presumably the consumer prefers the most
# specific host; confirm.
BROWSING_CATEGORIES = {
    'social_media': {
        'domains': [
            'facebook.com', 'twitter.com', 'x.com', 'instagram.com', 'reddit.com',
            'linkedin.com', 'tiktok.com', 'snapchat.com', 'pinterest.com',
            'tumblr.com', 'discord.com', 'slack.com', 'whatsapp.com', 'telegram.org',
            'mastodon.social', 'threads.net', 'bsky.social', 'bereal.com',
        ],
        'patterns': [r'social', r'/comments/', r'/status/', r'/post/'],
        'subcategories': {
            'professional': ['linkedin.com', 'slack.com'],
            'messaging': ['whatsapp.com', 'telegram.org', 'discord.com'],
            'content_sharing': ['instagram.com', 'tiktok.com', 'pinterest.com'],
        },
    },

    'entertainment': {
        'domains': [
            'youtube.com', 'netflix.com', 'spotify.com', 'twitch.tv', 'hulu.com',
            'disneyplus.com', 'hbomax.com', 'primevideo.com', 'vimeo.com',
            'soundcloud.com', 'pandora.com', 'applemusic.com', 'deezer.com',
            'crunchyroll.com', 'funimation.com',
            # Steam is served from steampowered.com; 'steam.com' is kept only
            # so existing behaviour for that host is unchanged.
            'steam.com', 'steampowered.com', 'epicgames.com',
            'ign.com', 'gamespot.com', 'kotaku.com', 'polygon.com',
        ],
        'patterns': [r'/watch', r'/video/', r'/episode/', r'/game/', r'wiki\.fandom\.com'],
        'subcategories': {
            'video': ['youtube.com', 'netflix.com', 'twitch.tv'],
            'music': ['spotify.com', 'soundcloud.com', 'pandora.com'],
            'gaming': [
                'steam.com', 'steampowered.com', 'epicgames.com', 'ign.com',
                r'\.fandom\.com',
            ],
        },
    },

    'development': {
        'domains': [
            'stackoverflow.com', 'github.com', 'gitlab.com', 'bitbucket.org',
            'developer.mozilla.org', 'w3schools.com', 'css-tricks.com',
            'dev.to', 'hashnode.dev', 'codesandbox.io', 'codepen.io',
            'jsfiddle.net', 'replit.com', 'vercel.com', 'netlify.com',
            'npmjs.com', 'pypi.org', 'crates.io', 'packagist.org',
            'docker.com', 'kubernetes.io', 'terraform.io',
        ],
        'patterns': [
            r'docs\..*\.(?:com|org|io)', r'.*\.readthedocs\.io', r'/documentation/',
            r'/api/', r'/reference/', r'github\.com/.*/(?:issues|pull|wiki)',
            r'stackoverflow\.com/questions/',
        ],
        'subcategories': {
            'q&a': ['stackoverflow.com', 'dev.to'],
            'repositories': ['github.com', 'gitlab.com', 'bitbucket.org'],
            'documentation': [r'docs\.', r'\.readthedocs\.io', 'developer.mozilla.org'],
            'tools': ['codesandbox.io', 'codepen.io', 'replit.com'],
        },
    },

    'learning': {
        'domains': [
            'coursera.org', 'udemy.com', 'edx.org', 'khanacademy.org',
            'udacity.com', 'pluralsight.com', 'lynda.com', 'skillshare.com',
            'masterclass.com', 'brilliant.org', 'datacamp.com', 'codecademy.com',
            'freecodecamp.org', 'mit.edu', 'stanford.edu', 'harvard.edu',
            'arxiv.org', 'scholar.google.com', 'jstor.org', 'pubmed.ncbi.nlm.nih.gov',
            'wikipedia.org', 'wikihow.com', 'instructables.com',
        ],
        'patterns': [
            r'/course/', r'/tutorial/', r'/learn/', r'/guide/', r'/how-to',
            r'\.edu/', r'/research/', r'/paper/', r'/study/',
        ],
        'subcategories': {
            'moocs': ['coursera.org', 'udemy.com', 'edx.org'],
            'technical': ['freecodecamp.org', 'codecademy.com', 'datacamp.com'],
            'academic': ['arxiv.org', 'scholar.google.com', 'jstor.org', r'\.edu/'],
            'practical': ['wikihow.com', 'instructables.com'],
        },
    },

    'productivity': {
        'domains': [
            'notion.so', 'trello.com', 'asana.com', 'todoist.com', 'monday.com',
            'clickup.com', 'airtable.com', 'basecamp.com', 'jira.atlassian.com',
            'confluence.atlassian.com', 'evernote.com', 'onenote.com', 'obsidian.md',
            'roamresearch.com', 'workflowy.com', 'calendar.google.com', 'outlook.com',
            'zoom.us', 'meet.google.com', 'teams.microsoft.com', 'calendly.com',
        ],
        'patterns': [r'/calendar/', r'/tasks/', r'/projects/', r'/workspace/'],
        'subcategories': {
            'project_management': ['trello.com', 'asana.com', 'jira.atlassian.com'],
            'notes': ['notion.so', 'evernote.com', 'obsidian.md'],
            'communication': ['zoom.us', 'meet.google.com', 'teams.microsoft.com'],
        },
    },

    'news': {
        'domains': [
            'nytimes.com', 'washingtonpost.com', 'wsj.com', 'ft.com', 'economist.com',
            'bbc.com', 'cnn.com', 'reuters.com', 'apnews.com', 'npr.org',
            'theguardian.com', 'foxnews.com', 'nbcnews.com', 'abcnews.go.com',
            'usatoday.com', 'politico.com', 'axios.com', 'bloomberg.com',
            'techcrunch.com', 'theverge.com', 'arstechnica.com', 'wired.com',
            'hackernews.com', 'news.ycombinator.com', 'lobste.rs', 'slashdot.org',
        ],
        # The last pattern targets dated URL paths such as /2024/01/31/.
        'patterns': [r'/article/', r'/story/', r'/news/', r'/\d{4}/\d{2}/\d{2}/'],
        'subcategories': {
            'mainstream': ['nytimes.com', 'bbc.com', 'cnn.com'],
            'tech': ['techcrunch.com', 'theverge.com', 'arstechnica.com'],
            'aggregators': ['news.ycombinator.com', 'reddit.com/r/news'],
        },
    },

    'shopping': {
        'domains': [
            'amazon.com', 'ebay.com', 'etsy.com', 'alibaba.com', 'walmart.com',
            'target.com', 'bestbuy.com', 'homedepot.com', 'lowes.com', 'ikea.com',
            'wayfair.com', 'shopify.com', 'wish.com', 'costco.com', 'sephora.com',
            'ulta.com', 'nike.com', 'adidas.com', 'apple.com', 'samsung.com',
        ],
        'patterns': [r'/product/', r'/cart/', r'/checkout/', r'/shop/', r'/store/'],
        'subcategories': {
            'marketplace': ['amazon.com', 'ebay.com', 'etsy.com'],
            'retail': ['walmart.com', 'target.com', 'costco.com'],
            'specialty': ['sephora.com', 'nike.com', 'apple.com'],
        },
    },

    'finance': {
        'domains': [
            'chase.com', 'bankofamerica.com', 'wellsfargo.com', 'citi.com',
            'paypal.com', 'venmo.com', 'cashapp.com', 'zelle.com', 'wise.com',
            'coinbase.com', 'binance.com', 'kraken.com', 'robinhood.com',
            'etrade.com', 'fidelity.com', 'vanguard.com', 'schwab.com',
            'mint.com', 'ynab.com', 'personalcapital.com', 'creditkarma.com',
        ],
        'patterns': [r'/banking/', r'/wallet/', r'/account/', r'/trading/'],
        'subcategories': {
            'banking': ['chase.com', 'bankofamerica.com', 'wellsfargo.com'],
            'payments': ['paypal.com', 'venmo.com', 'cashapp.com'],
            'investing': ['robinhood.com', 'fidelity.com', 'vanguard.com'],
            'crypto': ['coinbase.com', 'binance.com', 'kraken.com'],
        },
    },

    'health': {
        'domains': [
            'webmd.com', 'mayoclinic.org', 'healthline.com', 'medlineplus.gov',
            'nih.gov', 'cdc.gov', 'who.int', 'drugs.com', 'rxlist.com',
            'myfitnesspal.com', 'fitbit.com', 'strava.com', 'headspace.com',
            'calm.com', 'betterhelp.com', 'talkspace.com', 'zocdoc.com',
        ],
        'patterns': [r'/health/', r'/medical/', r'/symptoms/', r'/conditions/'],
        'subcategories': {
            'medical_info': ['webmd.com', 'mayoclinic.org', 'healthline.com'],
            'fitness': ['myfitnesspal.com', 'fitbit.com', 'strava.com'],
            'mental_health': ['headspace.com', 'calm.com', 'betterhelp.com'],
        },
    },

    'reference': {
        'domains': [
            'google.com', 'bing.com', 'duckduckgo.com', 'yandex.com', 'baidu.com',
            'dictionary.com', 'thesaurus.com', 'merriam-webster.com', 'oxforddictionaries.com',
            'translate.google.com', 'deepl.com', 'wolframalpha.com', 'archive.org',
            'maps.google.com', 'openstreetmap.org', 'waze.com', 'weather.com',
            'timeanddate.com', 'xe.com', 'calculator.net',
        ],
        'patterns': [r'/search', r'/define/', r'/translate/', r'/maps/', r'/directions/'],
        'subcategories': {
            'search': ['google.com', 'bing.com', 'duckduckgo.com'],
            'language': ['dictionary.com', 'translate.google.com', 'deepl.com'],
            'utilities': ['maps.google.com', 'weather.com', 'xe.com'],
        },
    },

    'professional': {
        'domains': [
            'salesforce.com', 'hubspot.com', 'zendesk.com', 'intercom.com',
            'mailchimp.com', 'constantcontact.com', 'hootsuite.com', 'buffer.com',
            'canva.com', 'figma.com', 'adobe.com', 'sketch.com', 'miro.com',
            'tableau.com', 'powerbi.microsoft.com', 'datastudio.google.com',
        ],
        'patterns': [r'/dashboard/', r'/analytics/', r'/reports/', r'/design/'],
        'subcategories': {
            'crm': ['salesforce.com', 'hubspot.com', 'zendesk.com'],
            'marketing': ['mailchimp.com', 'hootsuite.com', 'buffer.com'],
            'design': ['canva.com', 'figma.com', 'adobe.com'],
            'analytics': ['tableau.com', 'powerbi.microsoft.com'],
        },
    },
}

0 commit comments

Comments
 (0)