-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathchomsky_text.txt
123 lines (115 loc) · 5.46 KB
/
chomsky_text.txt
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
;; Sentence openers. chomsky-text places one of these first in every generated
;; sentence, followed by a subject, a verb phrase and an object.
(defq *starts* [
"To characterize a linguistic level L,"
"On the other hand,"
"This suggests that"
"It appears that"
"Furthermore,"
"We will bring evidence in favor of the following thesis: "
"To provide a constituent structure for T(Z,K),"
"From C1, it follows that"
"For any transformation which is sufficiently diversified in application to be of any interest,"
"Analogously,"
"Clearly,"
"Note that"
"Of course,"
"Suppose, for instance, that"
"Thus"
"With this clarification,"
"Conversely,"
"We have already seen that"
"By combining adjunctions and certain deformations,"
"I suggested that these results would follow from the assumption that"
"If the position of the trace in (99c) were only relatively inaccessible to movement,"
"However, this assumption is not correct, since"
"Comparing these examples with their parasitic gap counterparts in (96) and (97), we see that"
"In the discussion of resumptive pronouns following (81),"
"So far,"
"Nevertheless,"
"For one thing,"
"Summarizing, then, we assume that"
"A consequence of the approach just outlined is that"
"Presumably,"
"On our assumptions,"
"It may be, then, that"
"It must be emphasized, once again, that"
"Let us continue to suppose that"
"Notice, incidentally, that"
])
;; Subject noun phrases. chomsky-text places one of these second in every
;; generated sentence, right after the opener.
(defq *subjects* [
"the notion of level of grammaticalness"
"a case of semigrammaticalness of a different sort"
"most of the methodological work in modern linguistics"
"a subset of English sentences interesting on quite independent grounds"
"the natural general principle that will subsume this case"
"an important property of these three types of EC"
"any associated supporting element"
"the appearance of parasitic gaps in domains relatively inaccessible to ordinary extraction"
"the speaker-hearer's linguistic intuition"
"the descriptive power of the base component"
"the earlier discussion of deviance"
"this analysis of a formative as a pair of sets of features"
"this selectionally introduced contextual feature"
"a descriptively adequate grammar"
"the fundamental error of regarding functional notions as categorial"
"relational information"
"the systematic use of complex symbols"
"the theory of syntactic features developed earlier"
])
;; Verb phrases. chomsky-text places one of these third in every generated
;; sentence, between the subject and the object.
(defq *verbs* [
"can be defined in such a way as to impose"
"delimits"
"suffices to account for"
"cannot be arbitrary in"
"is not subject to"
"does not readily tolerate"
"raises serious doubts about"
"is not quite equivalent to"
"does not affect the structure of"
"may remedy and, at the same time, eliminate"
"is not to be considered in determining"
"is to be regarded as"
"is unspecified with respect to"
"is, apparently, determined by"
"is necessary to impose an interpretation on"
"appears to correlate rather closely with"
"is rather different from"
])
;; Object phrases. chomsky-text places one of these last in every generated
;; sentence; each entry already carries the sentence-final period.
(defq *objects* [
"problems of phonemic and morphological analysis."
"a corpus of utterance tokens upon which conformity has been defined by the paired utterance test."
"the traditional practice of grammarians."
"the levels of acceptability from fairly high (e.g. (99a)) to virtual gibberish (e.g. (98d))."
"a stipulation to place the constructions into these various categories."
"a descriptive fact."
"a parasitic gap construction."
"the extended c-command discussed in connection with (34)."
"the ultimate standard that determines the accuracy of any proposed grammar."
"the system of base rules exclusive of the lexicon."
"irrelevant intervening contexts in selectional rules."
"nondistinctness in the sense of distinctive feature theory."
"a general convention regarding the forms of the grammar."
"an abstract underlying order."
"an important distinction in language use."
"the requirement that branching is not tolerated within the dominance scope of a complex symbol."
"the strong generative capacity of the theory."
])
;; Exchanges the elements at indices `a` and `b` of list `l`, modifying `l`
;; itself. The local `c` keeps the original element at `a` while that slot is
;; overwritten with the element from `b`.
(defn swap-pos (l a b) (c (nth l a)) (do (set-nth l a (nth l b)) (set-nth l b c)))
;; Draws `n` elements from list `l` without using any position twice.
;;
;; The draw works on a private copy (`pool`), so the caller's list is left
;; untouched. Previously the elements were popped straight out of `l`, which
;; permanently shrank the phrase tables passed in by chomsky-text.
;;
;; On every round a random position is swapped with the last live position `i`,
;; `i` is decremented and the element now at the end of `pool` is popped.
;; The value returned is whatever `repeat` returns for the popped elements
;; (chomsky-text treats it as a list of `n` items).
;;
;; NOTE(review): the range of (randint i) is not visible here. If it never
;; returns `i` itself, the last element can never be picked on the first round;
;; confirm against the interpreter.
;; NOTE(review): `n` is presumably expected to be at most (len l); larger
;; values would pop from an empty pool. Verify the callers.
(defn distinct-random-n (l n) (random-pos nil) (pool []) (i (1- (len l)))
(do
  ; Copy the input element by element so later pops never touch `l`.
  (each (fn (item) (push pool item)) l)
  (repeat n (do (setq random-pos (randint i)) (swap-pos pool i random-pos) (-- i) (pop pool))))
)
;; Greedy word wrap.
;;
;; Splits `text` on single spaces and packs the words into lines, opening a new
;; line whenever adding the next word (plus its separating space) would make the
;; current line longer than `max-chars-per-line`. Words are never split: a word
;; longer than the limit ends up alone on its line. Returns the lines joined
;; with '\n'.
;;
;; `chars-in-line` starts at -1 so that the first word of the text is counted
;; without a leading separator.
(defn wrap (text max-chars-per-line)
(words (split text ' ')) (lines [[]]) (chars-in-line -1) (do
(each (fn (word) (let
(new-chars-in-line (+ chars-in-line (len word) 1))
(overflow (< max-chars-per-line new-chars-in-line)) (if overflow
; chars-in-line is negative only before the first word has been placed. In
; that case reuse the initial empty line instead of opening a second one, so
; an over-long first word no longer produces a leading blank line.
(do (if (< chars-in-line 0) (push (last lines) word) (push lines [word]))
(setq chars-in-line (len word)))
(do (push (last lines) word) (setq chars-in-line new-chars-in-line)))
)) words)
(join (map (fn (line) (join line ' ')) lines) '\n'))
)
;; Generates `n` sentences of mock-linguistics prose as one wrapped string.
;;
;; distinct-random-n picks `n` entries from each of *starts*, *subjects*,
;; *verbs* and *objects*. The four picks are then combined position by position
;; so that each sentence is opener + subject + verb phrase + object, joined by
;; single spaces. The sentences are joined with spaces and the result is wrapped
;; at 80 characters per line.
;; NOTE(review): ((apply zip) ...) presumably applies zip to the four picked
;; lists to form the per-sentence groups; confirm how `apply` behaves when given
;; only the function.
(defn chomsky-text (n) (wrap (join (map (fn (sentence) (join sentence ' '))
((apply zip) (map (fn (l) (distinct-random-n l n))
[*starts* *subjects* *verbs* *objects*]
))
) ' ') 80))
; Script entry point: generate five sentences and pass the wrapped text to puts.
(puts (chomsky-text 5))