-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathMakefile
More file actions
63 lines (36 loc) · 1.88 KB
/
Makefile
File metadata and controls
63 lines (36 loc) · 1.88 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
# Every recipe in this file writes its target through a shell redirect, so
# a failing command would otherwise leave an empty or truncated target
# behind that later runs treat as up to date.  Ask make to delete the
# target of any recipe that exits non-zero.
.DELETE_ON_ERROR:

# `all` and `clean` are commands, not files.
.PHONY: clean all

# Default goal: build the final `correlated` output.
all: correlated

# Remove every generated intermediate and final file.  The downloaded
# sources (`cmudict`, `kilgarriff`) are not matched by these patterns and
# are kept.  -f keeps this from failing when some (or all) of the files do
# not exist, e.g. on a fresh checkout or a repeated `make clean`.
clean:
	rm -f kilgarriff_* cmudict_* correlated uncorrelated
############################################################
# Download the raw CMU pronouncing dictionary.
#   --fail      exit non-zero on an HTTP error instead of saving the
#               server's error page as the dictionary
#   --location  follow redirects
# The data is written to a temporary name and renamed only after a
# successful transfer, so an interrupted download never leaves a file that
# make would consider an up-to-date `cmudict`.
cmudict:
	curl --fail --location --output $@.part \
		http://svn.code.sf.net/p/cmusphinx/code/trunk/cmudict/cmudict-0.7b \
		|| { rm -f $@.part; exit 1; }
	mv $@.part $@

# Download and decompress the Kilgarriff BNC word list.
# Download and decompression are separate steps so that a failed transfer
# is detected on its own (in a `curl | gunzip` pipeline only gunzip's exit
# status is seen), and the target only appears once both steps succeeded.
kilgarriff:
	curl --fail --location --output $@.gz.part \
		http://www.kilgarriff.co.uk/BNClists/all.al.gz \
		|| { rm -f $@.gz.part; exit 1; }
	gunzip < $@.gz.part > $@.part \
		|| { rm -f $@.gz.part $@.part; exit 1; }
	rm -f $@.gz.part
	mv $@.part $@
# kilgarriff.num::
# curl http://www.kilgarriff.co.uk/BNClists/all.num.gz | gunzip > kilgarriff.num
############################################################
# cmudict pipeline: each stage reads the previous stage's file ($<) and
# writes its own target ($@).  --text makes grep treat the input as text
# even if it contains bytes that would make it look binary.

# Stage 05: drop the lines that start with ';;;' (dictionary comments).
cmudict_05_no_comments: cmudict
	grep --text -v '^;;;' $< > $@

# Stage 07: drop every line containing the phoneme sequence 'D EY2 JH AA1'.
# NOTE(review): per the target name this removes an entry whose headword
# has problematic non-ASCII bytes -- confirm against the raw dictionary.
cmudict_07_remove_bad_unicode: cmudict_05_no_comments
	grep --text -v 'D EY2 JH AA1' $< > $@

# Stage 10: keep only the first pronunciation of each word by dropping
# lines whose headword carries a '(N)' suffix.
# The parentheses are deliberately NOT backslash-escaped: in grep's default
# basic-regex syntax '\(' and '\)' are grouping operators, so the escaped
# form matched any headword that merely contains a digit and discarded
# those words as well.
cmudict_10_first_only: cmudict_07_remove_bad_unicode
	grep --text -v '^[^ ]*([0-9][0-9]*)' $< > $@

# Stage 20: filter through ./discard_stress.py (stdin -> stdout).
# NOTE(review): presumably strips the stress digits from the phonemes --
# the script is not shown here.
cmudict_20_discard_stress: cmudict_10_first_only
	./discard_stress.py < $< > $@

# Final artifact: a stable name for the last pipeline stage.
cmudict_processed: cmudict_20_discard_stress
	cp $< $@
############################################################
# kilgarriff pipeline: every stage turns its single prerequisite ($<) into
# its own target ($@).

# Stage 05: keep only the first two whitespace-separated fields per line.
kilgarriff_05_discard_fields: kilgarriff
	awk '{print $$1, $$2}' < $< > $@

# Stage 07: drop the first line (a total, going by the target name).
kilgarriff_07_discard_total: kilgarriff_05_discard_fields
	sed '1d' < $< > $@

# Stage 10: filter through ./squash_kilgarriff.py (stdin -> stdout).
# NOTE(review): presumably merges duplicate words -- script not shown here.
kilgarriff_10_squashed: kilgarriff_07_discard_total
	./squash_kilgarriff.py < $< > $@

# Stage 20: order lines by their leading number, largest first.
kilgarriff_20_sorted: kilgarriff_10_squashed
	sort --numeric-sort --reverse < $< > $@

# Final artifact: a stable name for the last pipeline stage.
kilgarriff_processed: kilgarriff_20_sorted
	cp $< $@
############################################################
# Final step: runs once both processed inputs exist.
# NOTE(review): ./make_correlated.py takes no arguments here, so it
# presumably opens kilgarriff_processed and cmudict_processed by name and
# writes `correlated` (and `uncorrelated`, which `clean` removes) itself --
# confirm against the script.
correlated: \
		kilgarriff_processed \
		cmudict_processed
	./make_correlated.py